Kevin Meza Landeros

Extracción de información de la base de datos DISEASES

# MONOGENIC DISEASES
# Team 5
#
# Extracts the DISEASES text-mining records that mention the monogenic-disease
# DOID terms, merges them, lists the associated gene identifiers (first
# column) and pulls the matching annotation rows out of the Ensembl export.
#
# Run with bash from the directory that contains the two input files.
#
# Inputs (relative to the working directory):
#   human_disease_textmining_full.tsv  tab-separated table searched for DOID terms
#   mart_export.txt                    annotation table searched for the gene identifiers
# Outputs:
#   DOID_filter/<subset>.tsv                       one file per DOID term
#   DOID_filter/merge_monogenic_diseases.tsv       concatenation of the subsets
#   DOID_filter/merge_list_monogenic_diseases.tsv  unique gene identifiers
#   match.tsv                                      annotation rows for those genes

set -euo pipefail

readonly DISEASES_TSV='human_disease_textmining_full.tsv'
readonly MART_EXPORT='mart_export.txt'
readonly OUT_DIR='DOID_filter'
readonly MERGED_TSV="${OUT_DIR}/merge_monogenic_diseases.tsv"
readonly GENE_LIST="${OUT_DIR}/merge_list_monogenic_diseases.tsv"
readonly MATCH_TSV='match.tsv'

# "DOID term=output basename" pairs, listed in the order they are merged.
readonly -a DOID_TERMS=(
  'DOID:0050739=autosomal_monogenic_diseases'
  'DOID:0050177=monogenic_diseases'
  'DOID:0050735=x_linked_monogenic_diseases'
  'DOID:0050738=y_linked_monogenic_diseases'
)

# Print a message to stderr and abort.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Run grep with the given arguments, treating "no lines matched" (exit 1) as
# success: an empty subset is a valid result and must not trip `set -e`.
# Any other non-zero status (e.g. unreadable file) is propagated.
grep_allow_empty() {
  local status=0
  grep "$@" || status=$?
  (( status <= 1 )) || return "${status}"
}

# Fail early with a clear message instead of silently producing empty outputs.
for input in "${DISEASES_TSV}" "${MART_EXPORT}"; do
  [[ -r "${input}" ]] || die "error: cannot read input file: ${input}"
done
mkdir -p -- "${OUT_DIR}"

# Filter the diseases of interest: one output file per DOID term.
# -F matches the term literally; -w keeps a longer identifier that merely
# starts with the same digits from matching.
filtered_files=()
for term in "${DOID_TERMS[@]}"; do
  doid=${term%%=*}
  subset=${term#*=}
  subset_file="${OUT_DIR}/${subset}.tsv"
  grep_allow_empty -F -w -- "${doid}" "${DISEASES_TSV}" > "${subset_file}"
  filtered_files+=("${subset_file}")
done

# Group all monogenic-disease records into a single file.
cat -- "${filtered_files[@]}" > "${MERGED_TSV}"

# Build the list of genes associated with monogenic diseases (first column).
# Duplicates are dropped (first-seen order is kept) and empty identifiers are
# skipped: an empty pattern line would make the final grep match every row.
awk -F'\t' '$1 != "" && !seen[$1]++ { print $1 }' "${MERGED_TSV}" > "${GENE_LIST}"

# Retrieve the Ensembl annotation for each gene of interest.
# -F/-w: identifiers are literal whole tokens, not regular expressions.
grep_allow_empty -F -w -f "${GENE_LIST}" -- "${MART_EXPORT}" > "${MATCH_TSV}"