Carlos-Francisco Méndez-Cruz

New terminological tagging for CRFs

...@@ -158,6 +158,7 @@ if __name__ == "__main__": ...@@ -158,6 +158,7 @@ if __name__ == "__main__":
158 break 158 break
159 #print("Line: {}".format(line)) 159 #print("Line: {}".format(line))
160 if not found: 160 if not found:
161 + wordOrig = word
161 for i in range(repetitions, 0, -1): 162 for i in range(repetitions, 0, -1):
162 wordOrig = wordOrig.replace('-', ' ', 1) 163 wordOrig = wordOrig.replace('-', ' ', 1)
163 print("Word: {}".format(wordOrig)) 164 print("Word: {}".format(wordOrig))
...@@ -171,8 +172,8 @@ if __name__ == "__main__": ...@@ -171,8 +172,8 @@ if __name__ == "__main__":
171 line = line.rstrip('\n') 172 line = line.rstrip('\n')
172 break 173 break
173 if not found: 174 if not found:
174 - for i in range(0, repetitions): 175 + for i in range(1, repetitions + 1):
175 - wordOrig = word.replace('-', ' ', 1) 176 + wordOrig = word.replace('-', ' ', i)
176 print("Word: {}".format(wordOrig)) 177 print("Word: {}".format(wordOrig))
177 if wordOrig in hashTermsOrig[termTag]: 178 if wordOrig in hashTermsOrig[termTag]:
178 print("WordOrig: {}".format(wordOrig)) 179 print("WordOrig: {}".format(wordOrig))
......