test_mapping.py
1.63 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import pandas as pd
import format_fun
import mapping_fun
# Placeholder input table: every column holds the same dummy value repeated
# three times, so the resulting frame has three identical rows.
# NOTE(review): column names presumably mirror what mapping_fun expects for
# its first argument -- confirm against mapping_fun.
ex_dic = {
    "GSE": ["GSEnnn"] * 3,
    "GSM": ["GSMnnn"] * 3,
    "GPL_PMID": ["GPLnnn-PMID:nnn"] * 3,
    "BANGLINE": ["growth_protocol_ch1.1"] * 3,
    "FULLTEXT": ["Loreum loreum <tag> loreum 37 </tag>"] * 3,
    "TERM_NAME": ["loreum 37"] * 3,
    "TERM_TYPE": ["exTag Type"] * 3,
}
npl_df = pd.DataFrame(ex_dic)
# Placeholder term table: six columns, each filled with one dummy value
# repeated three times. Shares the TERM_NAME value "loreum 37" with the
# input table built earlier in this script.
# NOTE(review): presumably stands in for the MCO ontology table -- confirm.
ex_dic = {
    "TERM_ID": ["MCOnnnn"] * 3,
    "TERM_CLASS_ID": ["XXXnnnn"] * 3,
    "TERM_CLASS_PARENT_ID": ["XXXnnnn"] * 3,
    "TERM_NAME": ["loreum 37"] * 3,
    "TERM_DESCRIPTION": ["Loreum loreum"] * 3,
    "TERM_HEAD": ["Loreum loreum"] * 3,
}
mco_df = pd.DataFrame(ex_dic)
# Placeholder link table: four columns, each filled with one dummy value
# repeated three times. Passed as the optional mco_links argument in the
# final mapping call of this script.
ex_dic = {
    "TERM_ID": ["MCOnnnn"] * 3,
    "GC_ID": ["MCOnnnn"] * 3,
    "TERM_TYPE": ["exTag Type"] * 3,
    "TERM_ORDER": ["Loreum"] * 3,
}
mco_links = pd.DataFrame(ex_dic)
# Smoke-run the two mapping entry points on the placeholder frames. The
# return values are discarded, so this only shows that each call completes
# without raising.

# String-match mapping without a link table: once with min_match left as
# None and once with an explicit value of 2.
mapping_fun.str_match_map_mco(npl_df, mco_df, mco_links=None, min_match=None)
mapping_fun.str_match_map_mco(npl_df, mco_df, mco_links=None, min_match=2)

# Raw mapping: first without a link table, then with the mco_links frame.
mapping_fun.raw_map_mco(npl_df, mco_df, mco_links=None)
mapping_fun.raw_map_mco(npl_df, mco_df, mco_links=mco_links)