Carlos-Francisco Méndez-Cruz

Training, cross-validation, and testing on the structural domain dataset

......@@ -43,7 +43,7 @@ __author__ = 'CMendezC'
# Execution:
# python training-crossvalidation-testing-binding-thrombin.py
# python training-crossvalidation-testing-dom.py
# --inputPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset
# --inputTrainingData trainData.txt
# --inputTrainingClasses trainClasses.txt
......@@ -60,7 +60,7 @@ __author__ = 'CMendezC'
# --removeStopWords
# source activate python3
# python training-crossvalidation-testing-binding-thrombin.py
# python training-crossvalidation-testing-dom.py
# --inputPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset
# --inputTrainingData trainData.txt
# --inputTrainingClasses trainClasses.txt
......@@ -75,7 +75,7 @@ __author__ = 'CMendezC'
# --kernel linear
# --reduction SVD200
# --removeStopWords
# python training-crossvalidation-testing-binding-thrombin.py --inputPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset --inputTrainingData trainData.txt --inputTrainingClasses trainClasses.txt --inputTestingData testData.txt --inputTestingClasses testClasses.txt --outputModelPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset/models --outputModelFile SVM-lineal-model.mod --outputReportPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset/reports --outputReportFile SVM-lineal.txt --classifier SVM --kernel linear
# python training-crossvalidation-testing-dom.py --inputPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset --inputTrainingData trainData.txt --inputTrainingClasses trainClasses.txt --inputTestingData testData.txt --inputTestingClasses testClasses.txt --outputModelPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset/models --outputModelFile SVM-lineal-model.mod --outputReportPath /home/compu2/bionlp/lcg-bioinfoI-bionlp/clasificacion-automatica/structural-domain-dataset/reports --outputReportFile SVM-lineal.txt --classifier SVM --kernel linear
# --reduction SVD200
# --removeStopWords
......@@ -85,7 +85,7 @@ __author__ = 'CMendezC'
if __name__ == "__main__":
# Parameter definition
parser = argparse.ArgumentParser(description='Training validation Binding Thrombin Dataset.')
parser = argparse.ArgumentParser(description='Training validation structural domain dataset.')
parser.add_argument("--inputPath", dest="inputPath",
help="Path to read input files", metavar="PATH")
parser.add_argument("--inputTrainingData", dest="inputTrainingData",
......@@ -115,7 +115,7 @@ if __name__ == "__main__":
parser.add_argument("--reduction", dest="reduction",
help="Feature selection or dimensionality reduction", metavar="NAME",
choices=('SVD200', 'SVD300', 'CHI250', 'CHI2100'), default='SVD200')
parser.add_option("--removeStopWords", default=False,
parser.add_argument("--removeStopWords", default=False,
action="store_true", dest="removeStopWords",
help="Remove stop words")
......