We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0ada8a7, commit be60f89. Copy full SHA for be60f89.
tokenizer/src/main/java/edu/illinois/cs/cogcomp/nlp/tokenizer/TokenizerStateMachine.java
@@ -336,7 +336,7 @@ public void process(char token) {
336
if (getCurrent().isAbbr())
337
return; // previous was upper case, acronym and word
338
// continues
339
- else if (Character.isWhitespace(c) && Character.isLowerCase(nextnextChar))
+ else if (Character.isLowerCase(nextnextChar))
340
return; // when the next char is white space and the next next char
341
// is lowercase, we know that the next word is not start of
342
// a sentence, so we continue.
0 commit comments