Skip to content

Commit cea42b8

Browse files
committed
Update other possible places where characterMap is queried with text that might have repeated whitespace
1 parent 79c4e3f commit cea42b8

File tree

3 files changed

+5
-2
lines changed

3 files changed

+5
-2
lines changed

src/edu/stanford/nlp/quoteattribution/Sieves/MSSieves/BaselineTopSpeakerSieve.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -153,7 +153,8 @@ public Person.Gender getGender(MentionData mention) {
153 153
gender = genderList.get(mentionText);
154 154
}
155 155
} else if(mention.type != null && mention.type.equals("name")) {
156-
gender = characterMap.get(mention.text).get(0).gender;
156+
String mentionText = mention.text.replaceAll("\\s+", " ");
157+
gender = characterMap.get(mentionText).get(0).gender;
157 158
}
158 159
return gender;
159 160
}

src/edu/stanford/nlp/quoteattribution/Sieves/MSSieves/MajoritySpeakerSieve.java

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@ public Counter<String> getTopSpeakerList() {
28 28
ArrayList<String> names = scanForNames(new Pair<>(0, doc.get(CoreAnnotations.TokensAnnotation.class).size() - 1)).first;
29 29

30 30
for(String name : names) {
31+
name = name.replaceAll("\\s+", " ");
31 32
characters.incrementCount(characterMap.get(name).get(0).name);
32 33
}
33 34
return characters;

src/edu/stanford/nlp/quoteattribution/Sieves/QMSieves/OneNameSentenceSieve.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,8 @@ public void oneNameSentence(Annotation doc) {
44 44

45 45
ArrayList<Integer> pronounsIndices = scanForPronouns(range);
46 46
if (names.size() == 1) {
47-
List<Person> p = characterMap.get(names.get(0));
47+
String name = names.get(0).replaceAll("\\s+", " ");
48+
List<Person> p = characterMap.get(name);
48 49

49 50
//guess if exactly one name
50 51
if (p.size() == 1 && pronounsIndices.size() == 0) {

0 commit comments

Comments
 (0)