diff --git a/src/segmenter.py b/src/segmenter.py index f1cee99..454006c 100644 --- a/src/segmenter.py +++ b/src/segmenter.py @@ -20,8 +20,8 @@ def __init__(self,file_obj): file = open(self.f_name,'r') def get_segments(self, input_text): - "Simple segementer spliting texts based on regex." - return re.split("[.!?]",input_text) + """Simple segmenter splitting texts based on regex while handling decimal points and abbreviations.""" + return re.split(r'(?