Spaces:
Sleeping
Sleeping
#Representation name (used for naming output files): | |
representation_name: AAC | |
#representation_name: LEARNED-VEC | |
#representation_name: T5 | |
#Benchmarks (should be one of the "similarity","family","function","affinity","all"): | |
# "similarity" for running protein semantic similarity inference benchmark | |
# "function" for running ontology-based function prediction benchmark | |
# "family" for running drug target protein family classification benchmark | |
# "affinity" for running protein-protein binding affinity estimation benchmark | |
# "all" for running all benchmarks | |
benchmark: all | |
#Path of the file containing representation vectors of UniProtKB/Swiss-Prot human proteins: | |
representation_file_human: ../data/representation_vectors/AAC_UNIPROT_HUMAN.csv | |
#representation_file_human: ../data/representation_vectors/LEARNED-VEC_UNIPROT_HUMAN.csv | |
#representation_file_human: ../data/representation_vectors/T5_UNIPROT_HUMAN.csv | |
#Path of the file containing representation vectors of samples in the SKEMPI dataset: | |
representation_file_affinity: ../data/representation_vectors/skempi_aac_representation_multi_col.csv | |
#representation_file_affinity: ../data/representation_vectors/skempi_learned-vec_representation_multi_col.csv | |
#representation_file_affinity: ../data/representation_vectors/skempi_t5_representation_multi_col.csv | |
#Semantic similarity inference benchmark dataset (should be a list that includes any combination of "Sparse", "200", and "500"): | |
similarity_tasks: ["Sparse","200","500"] | |
#Ontology-based function prediction benchmark dataset in terms of GO aspect (should be one of the following: "MF", "BP", "CC", or "All_Aspects"): | |
function_prediction_aspect: All_Aspects | |
#Ontology-based function prediction benchmark dataset in terms of size-based-splits (should be one of the following: "High", "Middle", "Low", or "All_Data_Sets") | |
function_prediction_dataset: All_Data_Sets | |
#Drug target protein family classification benchmark dataset in terms of similarity-based splits (should be a list that includes any combination of "nc", "uc50", "uc30", and "mm15") | |
family_prediction_dataset: ["nc","uc50","uc30","mm15"] | |
#Detailed results (can be True or False) | |
detailed_output: False | |