Carlos-Francisco Méndez-Cruz

New terminological tagging for CRFs

@@ -142,7 +142,9 @@ if __name__ == "__main__":
 if word in hashTerms[termTag]:
     if word.find('-') > -1:
         found = False
-        for i in range(word.count('-')):
+        repetitions = word.count('-')
+        print("repetitions: {}".format(repetitions))
+        for i in range(1, repetitions):
             wordOrig = word.replace('-', ' ', 1)
             #print("Word: {}".format(word))
             if wordOrig in hashTermsOrig[termTag]:
......