report_Run6_v2.txt 16.7 KB
********** TRAINING AND TESTING REPORT **********
Training file: training-data-set-70_v4.txt

best params:{'c1': 0.2615074589465166, 'c2': 0.00276705652339924}
best CV score:0.816301419715609
model size: 0.07M

Flat F1: 0.8270102352867752
             precision    recall  f1-score   support

         OD      0.652     0.405     0.500        37
         pH      1.000     1.000     1.000        12
  Technique      0.957     1.000     0.978        22
        Med      1.000     0.912     0.954        57
       Temp      0.818     1.000     0.900        18
       Vess      0.000     0.000     0.000         0
       Agit      0.000     0.000     0.000         0
      Phase      1.000     0.895     0.944        19
        Air      0.810     0.758     0.783        62
       Anti      1.000     1.000     1.000         9
     Strain      1.000     1.000     1.000         1
      Gtype      0.845     0.877     0.861       106
  Substrain      0.000     0.000     0.000         1
       Supp      0.881     0.706     0.784       136
   Gversion      0.000     0.000     0.000         0

avg / total      0.870     0.796     0.827       480


Top likely transitions:
Agit   -> Agit    6.901670
OD     -> OD      6.662115
Temp   -> Temp    5.932826
Med    -> Med     5.616057
Supp   -> Supp    4.930556
Air    -> Air     4.771871
Anti   -> Anti    4.504604
Gversion -> Gversion 4.501000
Phase  -> Phase   4.124266
Technique -> Technique 4.076096
Gtype  -> Gtype   3.973576
O      -> O       3.951466
pH     -> pH      2.018763
O      -> Supp    1.197390
O      -> Technique 1.079203
Gtype  -> Supp    1.043942
Air    -> O       0.963896
Supp   -> O       0.612092
Substrain -> Gtype   0.476807
O      -> Gtype   0.437647
Med    -> O       0.335890
Phase  -> O       0.267800
OD     -> Phase   0.245045
Temp   -> O       0.202449
O      -> Anti    0.134070
Technique -> Air     0.008370
O      -> Temp    0.000020
OD     -> Air     -0.031556
Gtype  -> OD      -0.047613
Phase  -> OD      -0.296269
Gtype  -> O       -0.463165
OD     -> O       -0.559048
Technique -> O       -0.753141
O      -> Air     -0.928594
Agit   -> O       -1.028076
Med    -> Supp    -1.262808
Substrain -> O       -1.295585


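Top unlikely transitions (same entries as the "Top likely transitions" list, sorted by descending weight; the least likely transitions are at the bottom):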
Agit   -> Agit    6.901670
OD     -> OD      6.662115
Temp   -> Temp    5.932826
Med    -> Med     5.616057
Supp   -> Supp    4.930556
Air    -> Air     4.771871
Anti   -> Anti    4.504604
Gversion -> Gversion 4.501000
Phase  -> Phase   4.124266
Technique -> Technique 4.076096
Gtype  -> Gtype   3.973576
O      -> O       3.951466
pH     -> pH      2.018763
O      -> Supp    1.197390
O      -> Technique 1.079203
Gtype  -> Supp    1.043942
Air    -> O       0.963896
Supp   -> O       0.612092
Substrain -> Gtype   0.476807
O      -> Gtype   0.437647
Med    -> O       0.335890
Phase  -> O       0.267800
OD     -> Phase   0.245045
Temp   -> O       0.202449
O      -> Anti    0.134070
Technique -> Air     0.008370
O      -> Temp    0.000020
OD     -> Air     -0.031556
Gtype  -> OD      -0.047613
Phase  -> OD      -0.296269
Gtype  -> O       -0.463165
OD     -> O       -0.559048
Technique -> O       -0.753141
O      -> Air     -0.928594
Agit   -> O       -1.028076
Med    -> Supp    -1.262808
Substrain -> O       -1.295585


Top positive:
7.812637 O        b'lemma:1'
6.504281 O        b'lemma:3'
6.400430 O        b'word[:2]:re'
6.304930 Technique b'word[:2]:Ch'
6.279826 Air      b'word[:2]:Ae'
5.852043 O        b'lemma:2'
5.816867 O        b'-2:lemma:_'
5.295700 Anti     b'-2:lemma:antibody'
5.063616 Phase    b'lemma:stationary'
4.995551 Air      b'lemma:anaerobic'
4.918388 O        b'lemma:a'
4.801031 O        b'+2:lemma:\xc2\xb0c'
4.623525 O        b'postag:IN'
4.395080 Gtype    b'-1:lemma:\xe2\x88\x86'
4.294827 Phase    b'lemma:mid-log'
4.288438 Gtype    b'-2:lemma:genotype/variation'
4.244795 Technique b'word[:2]:RN'
4.131863 O        b'postag::'
4.115454 Temp     b'-1:lemma:sample'
3.937161 O        b'+2:lemma:cra'
3.620368 O        b'lemma:.'
3.620368 O        b'postag:.'
3.598727 Gtype    b'lemma:type'
3.598727 Gtype    b'word[:2]:ty'
3.574166 Gtype    b'word[:1]:\xce\x94'
3.565566 Gtype    b'word[:2]:Fl'
3.545115 O        b'word[:1]:S'
3.473665 O        b'word[:1]:G'
3.465522 Med      b'word[:2]:LB'
3.406689 O        b'-1:lemma:tag'
3.343307 O        b'word[:2]:ge'
3.313070 O        b'postag:VBN'
3.293280 Supp     b'lemma:nitrate'
3.293280 Supp     b'word[:2]:ni'
3.264010 O        b'+2:lemma:fructose'
3.240524 O        b'+1:postag:RB'
3.140733 Supp     b'lemma:arginine'
3.120877 O        b'word[:1]:B'
3.061754 Air      b'word[:2]:An'
3.016856 Supp     b'+1:lemma:1'
2.979008 OD       b'word[:2]:OD'
2.975113 O        b'word[:2]:Rp'
2.916749 Supp     b'+1:lemma:\xc2\xb5m'
2.856866 Supp     b'word[:1]:I'
2.771072 Temp     b'word[:1]:3'
2.740905 Anti     b'+1:lemma:antibody'
2.679770 O        b'lemma:_'
2.679770 O        b'word[:1]:_'
2.661062 Med      b'word[:1]:M'
2.651438 Supp     b'-2:lemma:shake'
2.637158 Supp     b'+1:lemma:2'
2.593344 Med      b'lemma:MOPS'
2.593344 Med      b'word[:2]:MO'
2.551429 O        b'postag:DT'
2.548355 O        b'+1:postag:VBP'
2.546726 Gtype    b'-2:lemma:delta'
2.530641 Anti     b'+2:lemma:antibody'
2.523357 Supp     b'lemma:Iron'
2.523357 Supp     b'word[:2]:Ir'
2.523357 Supp     b'-2:lemma:Anaerobic'
2.503256 Gtype    b'word[:1]:d'
2.469925 OD       b'word[:1]:O'
2.458839 O        b'word[:2]:Cr'
2.448696 O        b'-1:lemma:Aerobic'
2.435690 Med      b'+2:lemma:with'
2.412032 Supp     b'word[:2]:Fe'
2.383646 O        b'+2:lemma:chipseq'
2.330968 O        b'postag:CC'
2.321337 O        b'lemma:purr'
2.315130 Phase    b'-2:lemma:phase'
2.313990 Air      b'word[:1]:A'
2.307788 Air      b'-1:lemma:co2'
2.270559 Gtype    b'lemma:nsrr'
2.270559 Gtype    b'word[:2]:Ns'
2.230916 O        b'-2:lemma:medium'
2.219186 O        b'lemma:b'
2.212270 O        b'lemma:rpob'
2.211847 Supp     b'lemma:acetate'
2.208823 Gtype    b'-1:lemma:rpob'
2.193351 Gtype    b'+2:lemma:glucose'
2.188714 Supp     b'-2:lemma:purr'
2.167125 Substrain b'lemma:mg1655'
2.167125 Substrain b'word[:2]:MG'
2.162173 Supp     b'-2:lemma:Lrp'
2.153258 pH       b'lemma:ph5'
2.153258 pH       b'+1:lemma:.5'
2.127429 Gversion b'lemma:chip-seq'
2.119617 O        b'-1:lemma:anaerobic'
2.097711 Gtype    b'+1:lemma:type'
2.093597 Gtype    b'lemma:\xe2\x88\x86'
2.093597 Gtype    b'word[:1]:\xe2\x88\x86'
2.073634 Med      b'word[:1]:L'
2.067738 Substrain b'word[:1]:M'
2.066496 Temp     b'+1:lemma:\xc2\xb0c'
2.028277 O        b'word[:2]:Lr'
1.996518 O        b'word[:1]:-'
1.987484 O        b'-1:lemma:media'
1.972620 pH       b'+1:postag:CD'
1.963565 Supp     b'+1:lemma:_'
1.929849 O        b'word[:2]:Cu'
1.926238 Gtype    b'word[:1]:W'
1.923997 O        b'-1:lemma:glucose'
1.920206 Supp     b'-1:lemma:Cra'
1.885222 Supp     b'+2:lemma:rifampicin'
1.838859 Temp     b'-1:lemma:\xcf\x8332'
1.835835 O        b'-1:lemma:lb'
1.834634 O        b'word[:2]:ch'
1.831989 O        b'-2:lemma:myc'
1.820007 Supp     b'-1:lemma:with'
1.819919 Supp     b'word[:2]:gl'
1.813003 Strain   b'lemma:k-12'
1.813003 Strain   b'word[:2]:K-'
1.800422 O        b'+1:lemma:od600'
1.786685 Supp     b'lemma:pq'
1.786685 Supp     b'word[:2]:PQ'
1.786098 Supp     b'-2:lemma:supplement'
1.773090 O        b'lemma:argr'
1.754463 Supp     b'-1:postag:CC'
1.752010 Temp     b'lemma:43'
1.752010 Temp     b'word[:2]:43'
1.748609 Gtype    b'-2:lemma:genotype'
1.713554 Supp     b'word[:1]:N'
1.705522 Med      b'+1:lemma:0.4'
1.705477 Gtype    b'-2:postag:DT'
1.699311 O        b'lemma:with'
1.697768 Temp     b'-2:lemma:\xcf\x8332'
1.696162 Supp     b'word[:1]:\xc2\xb5'
1.684853 Supp     b'+2:lemma:for'
1.669736 Med      b'+2:lemma:b2'
1.659149 Strain   b'word[:1]:K'
1.656653 O        b'lemma:A'
1.642261 Gtype    b'+1:lemma:with'
1.639045 O        b'-1:lemma:0.3'
1.637590 O        b'-1:lemma:type'
1.629911 Agit     b'-2:postag:IN'
1.626799 Supp     b'lemma:fructose'
1.598539 Gtype    b'word[:2]:cr'
1.562458 Air      b'+2:lemma:37'
1.560840 O        b'+1:postag:NNP'
1.545322 O        b'+1:lemma:nacl'
1.535808 Air      b'postag:RB'
1.534546 pH       b'word[:2]:pH'
1.526850 Air      b'word[:2]:an'
1.494453 Supp     b'+1:lemma:hour'
1.493417 Gtype    b'hGreek'
1.485107 Gtype    b'lemma:wt'
1.475865 O        b'lemma:Nac'
1.465086 O        b'-2:lemma:~'
1.460815 O        b'postag:VBD'
1.455969 OD       b'+1:lemma:stationary'
1.446469 Air      b'-2:postag:CD'
1.436964 O        b'word[:1]:c'
1.435630 Technique b'word[:1]:R'
1.424956 Temp     b'-1:lemma:43'
1.424148 Gtype    b'+1:lemma:flagtag'
1.422205 OD       b'word[:2]:0.'
1.409582 Gtype    b'postag:JJ'
1.404450 O        b'word[:1]:R'
1.388050 Gversion b'lemma:nc'
1.388050 Gversion b'word[:2]:NC'
1.382998 O        b'-2:lemma:co2'
1.376458 O        b'+1:lemma:chip-seq'
1.376458 O        b'word[:2]:In'
1.373329 Anti     b'word[:2]:an'
1.361226 Gtype    b'lemma:arca8myc'
1.361226 Gtype    b'-2:lemma:chip-arca'
1.348605 O        b'word[:1]:E'
1.340934 Supp     b'lemma:dpd'
1.340934 Supp     b'word[:2]:DP'
1.336435 O        b'+1:postag::'
1.336267 O        b'+1:postag:VBZ'
1.332234 O        b'word[:2]:fo'
1.326668 Gversion b'word[:2]:Ch'
1.308053 Gtype    b'-1:lemma:_'
1.306772 Supp     b'-1:lemma:+'
1.299920 O        b'+2:postag:JJ'
1.288650 Supp     b'lemma:rifampicin'
1.282895 OD       b'word[:1]:0'
1.279050 Air      b'word[:1]:a'
1.278342 Supp     b'word[:2]:ri'
1.276274 Air      b'-1:lemma:ChIP-Seq'
1.270749 Air      b'-2:lemma:IP'
1.268696 Gtype    b'word[:1]:F'
1.267720 Air      b'-2:lemma:%'
1.250226 Vess     b'lemma:flask'
1.250226 Vess     b'-1:lemma:warm'
1.250226 Vess     b'word[:2]:fl'
1.250226 Vess     b'-2:lemma:pre'
1.250226 Vess     b'+2:lemma:43'
1.248294 Technique b'-1:postag:CD'
1.241744 Med      b'+1:lemma:minimal'
1.240037 Supp     b'-2:lemma:for'
1.238645 O        b'word[:2]:or'
1.231304 Gversion b'-2:postag:VB'
1.230809 O        b'lemma:Custom'
1.221416 Supp     b'lemma:no3'
1.221416 Supp     b'word[:2]:NO'
1.208975 O        b'lemma:-'
1.208565 Supp     b'-1:postag:CD'
1.196345 Gtype    b'-2:postag:NNS'


Top negative:
-0.020651 Vess     b'hLower'
-0.021405 Gtype    b'word[:1]:g'
-0.022102 Temp     b'hGreek'
-0.023747 Air      b'-1:lemma:or'
-0.024998 O        b'+1:lemma:phase'
-0.026006 O        b'-1:lemma:of'
-0.026445 Technique b'lemma:chip-seq'
-0.027849 O        b'-1:lemma:the'
-0.028545 O        b'-1:lemma:-lrb-'
-0.028751 O        b'+1:postag:CD'
-0.029296 O        b'+1:lemma:-rrb-'
-0.033680 O        b'lemma:150'
-0.033680 O        b'+1:lemma:mg/ml'
-0.033680 O        b'word[:2]:15'
-0.033680 O        b'-2:lemma:concentration'
-0.033737 Supp     b'hGreek'
-0.037022 OD       b'+1:postag:CD'
-0.037317 O        b'-1:lemma:g/l'
-0.040115 Supp     b'+2:postag:NNS'
-0.040221 O        b'+1:lemma:supplement'
-0.040832 O        b'-2:lemma:of'
-0.040980 OD       b'postag:JJ'
-0.042683 O        b'-1:lemma:rifampicin'
-0.044489 Phase    b'+1:postag:NN'
-0.045601 O        b'+1:lemma:-lrb-'
-0.046663 O        b'word[:1]:p'
-0.050360 Supp     b'-2:postag:NN'
-0.052075 Air      b'postag:-RRB-'
-0.052075 Air      b'word[:2]:-R'
-0.055278 O        b'+1:lemma:95'
-0.056644 O        b'word[:2]:an'
-0.056812 O        b'word[:2]:WT'
-0.058247 Air      b'lemma:-rrb-'
-0.058272 Temp     b'postag:NN'
-0.060275 Supp     b'-1:postag:NN'
-0.068834 O        b'word[:1]:g'
-0.075194 O        b'lemma:0.1'
-0.075978 O        b'+1:lemma:300'
-0.078371 Med      b'-2:postag:NNP'
-0.085484 O        b'-1:lemma:mm'
-0.090665 Med      b'postag:NN'
-0.095552 Anti     b'symb'
-0.097859 O        b'-1:lemma:IP'
-0.098451 Gtype    b'postag:NNP'
-0.098891 O        b'+2:lemma:iptg'
-0.099213 O        b'+2:lemma:anaerobically'
-0.100378 O        b'-1:postag:-LRB-'
-0.100648 Air      b'-1:postag:CC'
-0.102134 Phase    b'-2:postag:NN'
-0.104356 O        b'-2:lemma:30'
-0.104398 O        b'-2:lemma:aerobically'
-0.104525 O        b'-2:postag:-LRB-'
-0.112855 O        b'-1:postag:VBN'
-0.129315 pH       b'postag:NN'
-0.130801 O        b'lemma:dissolve'
-0.130801 O        b'+2:lemma:methanol'
-0.132204 Gversion b'-1:postag:NN'
-0.135249 O        b'+2:lemma:-rrb-'
-0.136494 Temp     b'-2:postag:NN'
-0.140087 Air      b'postag:CC'
-0.143197 Anti     b'+1:postag:JJ'
-0.145931 O        b'lemma:dpd'
-0.145931 O        b'word[:2]:DP'
-0.146304 O        b'+1:lemma:minimal'
-0.149480 O        b'+2:lemma:mg1655'
-0.153199 O        b'lemma:glucose'
-0.156279 O        b'word[:2]:OD'
-0.167599 O        b'-2:lemma:anaerobically'
-0.169441 O        b'+2:lemma:.'
-0.169441 O        b'+2:postag:.'
-0.176081 O        b'-2:lemma:and'
-0.176601 O        b'word[:2]:gl'
-0.178983 O        b'word[:2]:30'
-0.182343 Supp     b'-2:lemma:-lrb-'
-0.182989 Gtype    b'+2:lemma:,'
-0.182989 Gtype    b'+2:postag:,'
-0.187940 O        b'-2:postag:RB'
-0.188522 Gtype    b'-1:postag:NN'
-0.193161 Supp     b'-2:postag:-LRB-'
-0.195209 O        b'+1:postag:VBG'
-0.195524 Gtype    b'-1:lemma:,'
-0.195524 Gtype    b'-1:postag:,'
-0.196160 O        b'-2:postag:-RRB-'
-0.205382 O        b'lemma:media'
-0.205997 O        b'+1:lemma:+'
-0.207188 O        b'-2:postag:VBG'
-0.214958 O        b'-1:postag:IN'
-0.216865 O        b'+2:lemma:fnr'
-0.220433 O        b'-1:lemma:iptg'
-0.225687 OD       b'+2:postag:CD'
-0.226895 Anti     b'+1:lemma:anti-fur'
-0.227678 O        b'+1:lemma:hour'
-0.227891 O        b'+1:lemma:\xc2\xb0c'
-0.233240 O        b'+1:postag:-RRB-'
-0.234954 O        b'+1:lemma:until'
-0.238139 O        b'lemma:2h'
-0.238139 O        b'-1:lemma:additional'
-0.238139 O        b'word[:2]:2h'
-0.240394 Med      b'-2:lemma:grow'
-0.240644 O        b'+1:lemma:cell'
-0.240717 O        b'lemma:20'
-0.241598 Air      b'+1:postag:JJ'
-0.243020 Air      b'+2:postag:IN'
-0.249072 O        b'+1:lemma:.'
-0.249072 O        b'+1:postag:.'
-0.270838 O        b'lemma:aerobically'
-0.270838 O        b'word[:2]:ae'
-0.272076 O        b'-2:lemma:IP'
-0.276552 Anti     b'+2:postag:JJ'
-0.282858 O        b'word[:2]:mg'
-0.291041 O        b'+1:lemma:_'
-0.299542 O        b'-2:postag:DT'
-0.314381 O        b'word[:1]:F'
-0.315135 O        b'+2:lemma:medium'
-0.316365 O        b'lemma:k-12'
-0.316365 O        b'word[:2]:K-'
-0.323941 O        b'-1:lemma:rpob'
-0.324142 O        b'+1:lemma:g/l'
-0.324651 OD       b'-2:postag:JJ'
-0.330410 Med      b'+1:postag:NN'
-0.337573 O        b'lemma:anaerobically'
-0.342544 O        b'word[:2]:ri'
-0.349990 Supp     b'+2:lemma:-rrb-'
-0.361823 O        b'-1:lemma:mid-log'
-0.376409 O        b'-1:lemma:nsrr'
-0.377222 Anti     b'+2:lemma:polyclonal'
-0.377621 O        b'-1:lemma:grow'
-0.387403 O        b'-2:lemma:rpob'
-0.393536 O        b'-1:lemma:37'
-0.397261 Supp     b'+2:postag:-RRB-'
-0.408344 O        b'word[:1]:K'
-0.411343 O        b'-1:lemma:0.2'
-0.413533 O        b'lemma:phase'
-0.415095 O        b'word[:2]:Fe'
-0.418603 Supp     b'-2:postag:JJ'
-0.422914 O        b'lemma:rifampicin'
-0.425448 O        b'-2:lemma:a'
-0.436504 O        b'-2:lemma::'
-0.440069 Med      b'-1:postag:NN'
-0.450178 Supp     b'+2:lemma:2'
-0.452858 O        b'lemma:of'
-0.452858 O        b'word[:2]:of'
-0.456778 Supp     b'lemma:2'
-0.464475 Agit     b'symb'
-0.477506 Supp     b'+2:postag:NN'
-0.480481 O        b'word[:2]:0.'
-0.484144 O        b'+2:lemma:rifampicin'
-0.495023 OD       b'+1:postag:NN'
-0.495729 O        b'lemma:methanol'
-0.495729 O        b'-2:lemma:dissolve'
-0.498568 O        b'-1:lemma:dissolve'
-0.498568 O        b'+1:lemma:methanol'
-0.501386 O        b'postag:RB'
-0.501736 O        b'-2:lemma:50'
-0.505561 Agit     b'hUpper'
-0.505561 Agit     b'hLower'
-0.507205 O        b'+1:postag:NNS'
-0.510498 O        b'+2:postag:-RRB-'
-0.539348 O        b'+2:postag:RB'
-0.550860 O        b'word[:1]:0'
-0.576925 Med      b'+1:postag:IN'
-0.579947 O        b'lemma:mid-log'
-0.589847 O        b'word[:1]:d'
-0.639331 Phase    b'hUpper'
-0.639331 Phase    b'hLower'
-0.644727 O        b'+1:postag:IN'
-0.678795 Med      b'symb'
-0.717017 Med      b'-2:postag:VBN'
-0.751995 Supp     b'word[:2]:an'
-0.759518 O        b'-1:lemma:co2'
-0.776028 O        b'-1:postag:VBG'
-0.792743 O        b'-2:lemma:supplement'
-0.794523 O        b'word[:2]:me'
-0.883371 O        b'word[:2]:ce'
-0.883506 O        b'lemma:wt'
-0.888247 O        b'+2:lemma:mid-log'
-0.920374 O        b'word[:2]:Ch'
-0.968528 O        b'word[:1]:N'
-1.043344 O        b'-2:lemma:rifampicin'
-1.053670 Gtype    b'word[:1]:C'
-1.081691 Supp     b'symb'
-1.097239 O        b'word[:1]:\xce\x94'
-1.146299 Air      b'-1:postag:JJ'
-1.205559 O        b'-2:lemma:phase'
-1.226939 Phase    b'postag:JJ'
-1.279089 O        b'-1:postag::'
-1.306934 O        b'word[:1]:P'
-1.435763 Air      b'postag:NN'
-1.552893 Supp     b'postag:JJ'
-1.656010 O        b'+1:lemma:in'
-1.838496 O        b'-1:lemma:2'
-1.866172 Technique b'postag:NN'
-2.005093 O        b'+1:lemma:at'
-2.021343 Anti     b'postag:NNP'
-2.209344 Supp     b'+2:postag:CD'
-2.425446 O        b'+1:lemma:2'
-2.700819 O        b'+1:lemma:1'
-2.961178 OD       b'word[:1]:-'
-3.613008 O        b'-1:lemma::'
-5.053367 O        b'-1:lemma:_'