We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 088f046 commit f44acf3 (Copy full SHA for f44acf3)
data.py
@@ -5,8 +5,6 @@
5
import torch
6
import re
7
8
-#from nltk import sent_tokenize
9
-
10
# Sentence-boundary pattern, assembled from named pieces.
#
# Both alternatives start with the same three negative lookbehinds, which
# refuse a boundary when the text immediately before the candidate position is:
#   * a single capital letter followed by a period (e.g. an initial "J."),
#   * "Mrs." / "mrs.",
#   * "Mr.", "Dr.", "Sr.", "Jr." (first letter in either case).
_NOT_AFTER_ABBREV = (
    r'(?<!\b[A-Z]\.)'
    r'(?<!\b[Mm]rs\.)'
    r'(?<!\b[MmDdSsJj]r\.)'
)

# Exactly one space/newline/tab that directly follows '.', '?' or '!' and is
# not itself followed by a quote character.
_WS_AFTER_PUNCT = _NOT_AFTER_ABBREV + r'(?<=[\.\?\!])[ \n\t](?!["\'])'

# A run of spaces/newlines/tabs preceded by '.', '?' or '!', then one space,
# then a single or double quote character.
_WS_AFTER_QUOTE = _NOT_AFTER_ABBREV + r'(?<=[\.\?\!] ["\'])[ \n\t]+'

re_sentend = re.compile('|'.join((_WS_AFTER_PUNCT, _WS_AFTER_QUOTE)))
11
12
def sent_tokenize(instr):
0 commit comments