DMS_id,DMS_filename,UniProt_ID,taxon,target_seq,seq_len,includes_multiple_mutants,DMS_total_number_mutants,DMS_number_single_mutants,DMS_number_multiple_mutants,DMS_binarization_cutoff,DMS_binarization_method,first_author,title,year,jo,region_mutated,molecule_name,source_organism,selection_assay,selection_type,MSA_filename,MSA_start,MSA_end,MSA_len,MSA_bitscore,MSA_theta,MSA_num_seqs,MSA_perc_cov,MSA_num_cov,MSA_N_eff,MSA_Neff_L,MSA_Neff_L_category,MSA_num_significant,MSA_num_significant_L,raw_DMS_filename,raw_DMS_phenotype_name,raw_DMS_directionality,raw_DMS_mutant_column,weight_file_name,SFT ckpt
A0A2Z5U3Z0_9INFA_Wu_2014,A0A2Z5U3Z0_9INFA_Wu_2014.csv,A0A2Z5U3Z0_9INFA,Virus,MKAKLLVLLYAFVATDADTICIGYHANNSTDTVDTILEKNVAVTHSVNLLEDSHNGKLCKLKGIAPLQLGKCNITGWLLGNPECDSLLPARSWSYIVETPNSENGACYPGDLIDYEELREQLSSVSSLERFEIFPKESSWPNHTFNGVTVSCSHRGKSSFYRNLLWLTKKGDSYPKLTNSYVNNKGKEVLVLWGVHHPSSSDEQQSLYSNGNAYVSVASSNYNRRFTPEIAARPKVRDQHGRMNYYWTLLEPGDTIIFEATGNLIAPWYAFALSRGFESGIITSNASMHECNTKCQTPQGAINSNLPFQNIHPVTIGECPKYVRSTKLRMVTGLRNIPSIQYRGLFGAIAGFIEGGWTGMIDGWYGYHHQNEQGSGYAADQKSTQNAINGITNKVNSVIEKMNTQFTAVGKEFNNLEKRMENLNKKVDDGFLDIWTYNAELLVLLENERTLDFHDLNVKNLYEKVKSQLKNNAKEIGNGCFEFYHKCDNECMESVRNGTYDYPKYSEESKLNREKIDGVKLESMGVYQILAIYSTVASSLVLLVSLGAISFWMCSNGSLQCRICI,565,False,2350,2350,0,0.0947955855,median,Wu,High-throughput profiling of influenza A virus hemagglutinin gene at single-nucleotide resolution,2014,10.1038/srep04942,1-565,HA,Influenza A virus (A/WSN/1933(H1N1)),Viral replication,Growth,A0A2Z5U3Z0_9INFA_theta0.99_full_11-26-2021_b09.a2m,1,565,565,0.9,0.01,57581,0.968,547,9809.4,17.93308958,medium,925,1.691042048,A0A2Z5U3Z0_9INFA_Wu_2014.csv,RF Index,1,mutant,A0A2Z5U3Z0_9INFA_theta_0.01.npy,../results/large_0to10/A0A2Z5U3Z0_9INFA_Wu_2014/sft_best.pt
A4GRB6_PSEAI_Chen_2020,A4GRB6_PSEAI_Chen_2020.csv,A4GRB6_PSEAI,Prokaryote,MFKLLSKLLVYLTASIMAIASPLAFSVDSSGEYPTVSEIPVGEVRLYQIADGVWSHIATQSFDGAVYPSNGLIVRDGDELLLIDTAWGAKNTAALLAEIEKQIGLPVTRAVSTHFHDDRVGGVDVLRAAGVATYASPSTRRLAEVEGNEIPTHSLEGLSSSGDAVRFGPVELFYPGAAHSTDNLIVYVPSASVLYGGCAIYELSRTSAGNVADADLAEWPTSIERIQQHYPEAQFVIPGHGLPGGLDLLKHTTNVVKAHTNRSVVE,266,False,5004,5004,0,-2.1,manual,Chen,"Comprehensive exploration of the translocation, stability and substrate recognition requirements in VIM-2 lactamase",2020,10.7554/eLife.56707,1-266,beta-lactamase VIM-2,Pseudomonas aeruginosa,"drug resistance (128/16/2.0 ug/mL ampicillin, 4.0/0.5 ug/mL cefotaxime, 0.031 ug/mL meropenem @ 25C, 37C)",Antibiotics resistance,A4GRB6_PSEAI_full_11-26-2021_b03.a2m,1,266,266,0.3,0.2,108496,0.726,193,31234.2,161.8352332,high,317,1.642487047,A4GRB6_PSEAI_Chen_2020.csv,0.031ug_mL_MEM_37C,1,mutant,A4GRB6_PSEAI_theta_0.2.npy,../results/large_0to10/A4GRB6_PSEAI_Chen_2020/sft_best.pt
AMIE_PSEAE_Wrenbeck_2017,AMIE_PSEAE_Wrenbeck_2017.csv,AMIE_PSEAE,Prokaryote,MRHGDISSSNDTVGVAVVNYKMPRLHTAAEVLDNARKIAEMIVGMKQGLPGMDLVVFPEYSLQGIMYDPAEMMETAVAIPGEETEIFSRACRKANVWGVFSLTGERHEEHPRKAPYNTLVLIDNNGEIVQKYRKIIPWCPIEGWYPGGQTYVSEGPKGMKISLIICDDGNYPEIWRDCAMKGAELIVRCQGYMYPAKDQQVMMAKAMAWANNCYVAVANAAGFDGVYSYFGHSAIIGFDGRTLGECGEEEMGIQYAQLSLSQIRDARANDQSQNHLFKILHRGYSGLQASGDGDRGLAECPFEFYRTWVTDAEKARENVERLTRSTTGVAQCPVGRLPYEGLEKEA,346,False,6227,6227,0,-0.2222,median,Wrenbeck,Single-mutation fitness landscapes for an enzyme on multiple substrates reveal specificity is globally encoded,2017,10.1038/ncomms15695,1-341,amiE,Pseudomonas aeruginosa,Enzyme function,Growth,AMIE_PSEAE_full_11-26-2021_b02.a2m,1,346,346,0.2,0.2,140703,0.725,251,29959.3,119.359761,high,557,2.219123506,AMIE_PSEAE_Wrenbeck_2017.csv,isobutyramide_normalized_fitness,1,mutant,AMIE_PSEAE_theta_0.2.npy,../results/large_10to20/AMIE_PSEAE_Wrenbeck_2017/sft_best.pt
B3VI55_LIPST_Klesmith_2015,B3VI55_LIPST_Klesmith_2015.csv,LGK_LIPST,Eukaryote,MPIATSTGDNVLDFTVLGLNSGTSMDGIDCALCHFYQKTPDAPMEFELLEYGEVPLAQPIKQRVMRMILEDTTSPSELSEVNVILGEHFADAVRQFAAERNVDLSTIDAIASHGQTIWLLSMPEEGQVKSALTMAEGAIIAARTGITSITDFRISDQAAGRQGAPLIAFFDALLLHHPTKLRACQNIGGIANVCFIPPDVDGRRTDEYYDFDTGPGNVFIDAVVRHFTNGEQEYDKDGAMGKRGKVDQELVDDFLKMPYFQLDPPKTTGREVFRDTLAHDLIRRAEAKGLSPDDIVATTTRITAQAIVDHYRRYAPSQEIDEIFMCGGGAYNPNIVEFIQQSYPNTKIMMLDEAGVPAGAKEAITFAWQGMECLVGRSIPVPTRVETRQHYVLGKVSPGLNYRSVMKKGMAFGGDAQQLPWVSEMIVKKKGKVITNNWA,439,False,7890,7890,0,-0.6245,median,Klesmith,Comprehensive Sequence-Flux Mapping of a Levoglucosan Utilization Pathway in E. coli,2015,10.1021/acssynbio.5b00131,1-439,LGK (levoglucosan kinase),Lipomyces starkeyi (Oleaginous yeast),Growth,Growth,B3VI55_LIPST_full_11-26-2021_b03.a2m,1,439,439,0.3,0.2,31069,0.813,357,7971.0,22.32773109,medium,588,1.647058824,B3VI55_LIPST_Klesmith_2015.csv,SelectionTwo,1,mutant,B3VI55_LIPST_theta_0.2.npy,../results/large_10to20/B3VI55_LIPST_Klesmith_2015/sft_best.pt
BLAT_ECOLX_Stiffler_2015,BLAT_ECOLX_Stiffler_2015.csv,BLAT_ECOLX,Prokaryote,MSIQHFRVALIPFFAAFCLPVFAHPETLVKVKDAEDQLGARVGYIELDLNSGKILESFRPEERFPMMSTFKVLLCGAVLSRVDAGQEQLGRRIHYSQNDLVEYSPVTEKHLTDGMTVRELCSAAITMSDNTAANLLLTTIGGPKELTAFLHNMGDHVTRLDRWEPELNEAIPNDERDTTMPAAMATTLRKLLTGELLTLASRQQLIDWMEADKVAGPLLRSALPAGWFIADKSGAGERGSRGIIAALGPDGKPSRIVVIYTTGSQATMDERNRQIAEIGASLIKHW,286,False,4996,4996,0,-1.159498916,median,Stiffler,Evolvability as a Function of Purifying Selection in TEM-1 β-lactamase,2015,10.1016/j.cell.2015.01.035,24-286,bla,Escherichia coli,Growth (10-2500 ug/mL ampicillin),Growth,BLAT_ECOLX_full_11-26-2021_b02.a2m,1,286,286,0.2,0.2,209644,0.752,215,47605.0,221.4186047,high,446,2.074418605,BLAT_ECOLX_Stiffler_2015.csv,2500,1,mutant,BLAT_ECOLX_theta_0.2.npy,../results/large_10to20/BLAT_ECOLX_Stiffler_2015/sft_best.pt
CP2C9_HUMAN_Amorosi_abundance_2021,CP2C9_HUMAN_Amorosi_abundance_2021.csv,CP2C9_HUMAN,Human,MDSLVVLVLCLSCLLLLSLWRQSSGRGKLPPGPTPLPVIGNILQIGIKDISKSLTNLSKVYGPVFTLYFGLKPIVVLHGYEAVKEALIDLGEEFSGRGIFPLAERANRGFGIVFSNGKKWKEIRRFSLMTLRNFGMGKRSIEDRVQEEARCLVEELRKTKASPCDPTFILGCAPCNVICSIIFHKRFDYKDQQFLNLMEKLNENIKILSSPWIQICNNFSPIIDYFPGTHNKLLKNVAFMKSYILEKVKEHQESMDMNNPQDFIDCFLMKMEKEKHNQPSEFTIESLENTAVDLFGAGTETTSTTLRYALLLLLKHPEVTAKVQEEIERVIGRNRSPCMQDRSHMPYTDAVVHEVQRYIDLLPTSLPHAVTCDIKFRNYLIPKGTTILISLTSVLHDNKEFPNPEMFDPHHFLDEGGNFKKSKYFMPFSAGKRICVGEALAGMELFLFLTSILQNFNLKSLVDPKNLDTTPVVNGFASVPPFYQLCFIPV,490,False,6370,6370,0,0.7723244345,median,Amorosi,Massively parallel characterization of CYP2C9 variant enzyme activity and abundance,2021,10.1016/j.ajhg.2021.07.001,1-490,CP2C9,Homo sapiens,"Growth, activity","Growth, activity",CP2C9_HUMAN_full_11-26-2021_b04.a2m,1,490,490,0.4,0.2,264279,0.886,434,81212.1,187.1246544,high,1092,2.516129032,CP2C9_HUMAN_Amorosi_2021.csv,abundance_score,1,variant,CP2C9_HUMAN_theta_0.2.npy,../results/large_20to30/CP2C9_HUMAN_Amorosi_abundance_2021/sft_best.pt
DLG4_HUMAN_Faure_2021,DLG4_HUMAN_Faure_2021.csv,DLG4_HUMAN,Human,MDCLCIVTTKKYRYQDEDTPPLEHSPAHLPNQANSPPVIVNTDTLEAPGYELQVNGTEGEMEYEEITLERGNSGLGFSIAGGTDNPHIGDDPSIFITKIIPGGAAAQDGRLRVNDSILFVNEVDVREVTHSAAVEALKEAGSIVRLYVMRRKPPAEKVMEIKLIKGPKGLGFSIAGGVGNQHIPGDNSIYVTKIIEGGAAHKDGRLQIGDKILAVNSVGLEDVMHEDAVAALKNTYDVVYLKVAKPSNAYLSDSYAPPDITTSYSQHLDNEISHSSYLGTDYPTAMTPTSPRRYSPVAKDLLGEEDIPREPRRIVIHRGSTGLGFNIVGGEDGEGIFISFILAGGPADLSGELRKGDQILSVNGVDLRNASHEQAAIALKNAGQTVTIIAQYKPEEYSRFEAKIHDLREQLMNSSLGSGTASLRSNPKRGFYIRALFDYDKTKDCGFLSQALSFRFGDVLHVIDASDEEWWQARRVHSDSETDDIGFIPSKRRVERREWSRLKAKDWGSSSGSQGREDSVLSYETVTQMEVHYARPIIILGPTKDRANDDLLSEFPDKFGSCVPHTTRPKREYEIDGRDYHFVSSREKMEKDIQAHKFIEAGQYNSHLYGTSVQSVREVAEQGKHCILDVSANAVRRLQAAHLHPIAIFIRPRSLENVLEINKRITEEQARKAFDRATKLEQEFTECFSAIVEGDSFEEIYHKVKRVIEDLSGPYIWVPARERL,724,True,6976,1280,5696,-0.5602585328,median,Faure,Mapping the energetic and allosteric landscapes of protein binding domains,2022,10.1038/s41586-022-04586-4,311-394,PSD95-PDZ3,Homo sapiens,Yeast growth,Growth,DLG4_HUMAN_full_11-26-2021_b02.a2m,1,724,724,0.2,0.2,25338,0.825,597,354.3,0.5934673367,low,7,0.01172529313,DLG4_HUMAN_Faure_2021.csv,fitness,1,mutant,DLG4_HUMAN_theta_0.2.npy,../results/large_20to30/DLG4_HUMAN_Faure_2021/sft_best.pt
F7YBW8_MESOW_Aakre_2015,F7YBW8_MESOW_Aakre_2015.csv,F7YBW8_MESOW,Prokaryote,MANVEKMSVAVTPQQAAVMREAVEAGEYATASEIVREAVRDWLAKRELRHDDIRRLRQLWDEGKASGRPEPVDFDALRKEARQKLTEVPPNGR,93,True,9192,37,9155,-0.001724,median,Aakre,Evolving New Protein-Protein Interaction Specificity through Promiscuous Intermediates,2015,10.1016/j.cell.2015.09.055,59-64,Mesop_5599,Mesorhizobium opportunistum (strain LMG 24607 / HAMBI 3007 / WSM2075),fitness,Growth (antitoxin neutralization of ParE3),F7YBW8_MESOW_full_01-07-2022_b02.a2m,1,93,93,0.2,0.2,38613,0.774,72,16262.4,225.8666667,high,31,0.4305555556,F7YBW8_MESOW_Aakre_2015.csv,fitness,1,mutant,F7YBW8_MESOW_theta_0.2.npy,../results/large_30to40/F7YBW8_MESOW_Aakre_2015/sft_best.pt
GCN4_YEAST_Staller_induction_2018,GCN4_YEAST_Staller_induction_2018.csv,GCN4_YEAST,Eukaryote,MSEYQPSLFALNPMGFSPLDGSKSTNENVSASTSTAKPMVGQLIFDKFIKTEEDPIIKQDTPSNLDFDFALPQTATAPDAKTVLPIPELDDAVVESFFSSSTDSTPMFEYENLEDNSKEWTSLFDNDIPVTTDDVSLADKAIESTEEVSLVPSNLEVSTTSFLPTPVLEDAKLTQTRKVKKPNSVVKKSHHVGKDDESRLDHLGVVAYNRKQRSIPLSPIVPESSDPAALKRARNTEAARRSRARKLQRMKQLEDKVEELLSKNYHLENEVARLKKLVGER,281,True,2638,33,2605,1.293757864,median,Staller,A High-Throughput Mutational Scan of an Intrinsically Disordered Acidic Transcriptional Activation Domain,2018,10.1016/j.cels.2018.01.015,101-144,Gcn4,Saccharomyces cerevisiae,Binding,FACS,GCN4_YEAST_full_24-02-2022_b03.a2m,1,281,281,0.3,0.2,350,0.719,202,177.9,0.8806930693,low,1,0.00495049505,GCN4_YEAST_Staller_2018.csv,Induction,1,mutant,GCN4_YEAST_theta_0.2.npy,../results/large_30to40/GCN4_YEAST_Staller_induction_2018/sft_best.pt
HSP82_YEAST_Mishra_2016,HSP82_YEAST_Mishra_2016.csv,HSP82_YEAST,Eukaryote,MASETFEFQAEITQLMSLIINTVYSNKEIFLRELISNASDALDKIRYKSLSDPKQLETEPDLFIRITPKPEQKVLEIRDSGIGMTKAELINNLGTIAKSGTKAFMEALSAGADVSMIGQFGVGFYSLFLVADRVQVISKSNDDEQYIWESNAGGSFTVTLDEVNERIGRGTILRLFLKDDQLEYLEEKRIKEVIKRHSEFVAYPIQLVVTKEVEKEVPIPEEEKKDEEKKDEEKKDEDDKKPKLEEVDEEEEKKPKTKKVKEEVQEIEELNKTKPLWTRNPSDITQEEYNAFYKSISNDWEDPLYVKHFSVEGQLEFRAILFIPKRAPFDLFESKKKKNNIKLYVRRVFITDEAEDLIPEWLSFVKGVVDSEDLPLNLSREMLQQNKIMKVIRKNIVKKLIEAFNEIAEDSEQFEKFYSAFSKNIKLGVHEDTQNRAALAKLLRYNSTKSVDELTSLTDYVTRMPEHQKNIYYITGESLKAVEKSPFLDALKAKNFEVLFLTDPIDEYAFTQLKEFEGKTLVDITKDFELEETDEEKAEREKEIKEYEPLTKALKEILGDQVEKVVVSYKLLDAPAAIRTGQFGWSANMERIMKAQALRDSSMSSYMSSKKTFEISPKSPIIKELKKRVDEGGAQDKTVKDLTKLLYETALLTSGFSLDEPTSFASRINRLISLGLNIDEDEETETAPEASTAAPVEEVPADTEMEEVD,709,False,4323,4323,0,-0.4,manual,Mishra,Systematic Mutant Analyses Elucidate General and Client-Specific Aspects of Hsp90 Function,2016,10.1016/j.celrep.2016.03.046,2-231,HSP82,Saccharomyces cerevisiae S288C,Growth,Growth,HSP82_YEAST_full_11-26-2021_b01.a2m,1,709,709,0.1,0.2,38923,0.862,611,3684.8,6.030769231,medium,433,0.7086743044,HSP82_YEAST_Mishra_2016.csv,selection_coefficient,1,mutant,HSP82_YEAST_theta_0.2.npy,../results/large_30to40/HSP82_YEAST_Mishra_2016/sft_best.pt
KKA2_KLEPN_Melnikov_2014,KKA2_KLEPN_Melnikov_2014.csv,KKA2_KLEPN,Prokaryote,MIEQDGLHAGSPAAWVERLFGYDWAQQTIGCSDAAVFRLSAQGRPVLFVKTDLSGALNELQDEAARLSWLATTGVPCAAVLDVVTEAGRDWLLLGEVPGQDLLSSHLAPAEKVSIMADAMRRLHTLDPATCPFDHQAKHRIERARTRMEAGLVDQDDLDEEHQGLAPAELFARLKARMPDGEDLVVTHGDACLPNIMVENGRFSGFIDCGRLGVADRYQDIALATRDIAEELGGEWADRFLVLYGIAAPDSQRIAFYRLLDEFF,264,False,4960,4960,0,0.5,manual,Melnikov,Comprehensive mutational scanning of a kinase in vivo reveals substrate-dependent fitness landscapes,2014,10.1093/nar/gku511,1-264,"APH(3’)II, neo",Klebsiella pneumoniae,"Growth (225 ug/mL kanamycin) 1:1, 1:2, 1:4, 1:8 dilutions",Growth,KKA2_KLEPN_full_11-26-2021_b02.a2m,1,264,264,0.2,0.2,234760,0.795,210,76876.7,366.0795238,high,377,1.795238095,KKA2_KLEPN_Melnikov_2014.csv,Kan18_avg,1,mutant,KKA2_KLEPN_theta_0.2.npy,../results/large_40to50/KKA2_KLEPN_Melnikov_2014/sft_best.pt
NUD15_HUMAN_Suiter_2020,NUD15_HUMAN_Suiter_2020.csv,NUD15_HUMAN,Human,MTASAQPRGRRPGVGVGVVVTSCKHPRCVLLGKRKGSVGAGSFQLPGGHLEFGETWEECAQRETWEEAALHLKNVHFASVVNSFIEKENYHYVTILMKGEVDVTHDSEPKNVEPEKNESWEWVPWEELPPLDQLFWGLRCLKEQGYDPFKEDLNHLVGYKGNHL,164,False,2844,2844,0,0.25,manual,Suiter,Massively parallel variant characterization identifies NUDT15 alleles associated with thiopurine toxicity,2020,10.1073/pnas.1915680117,2-164,NUDT15,Homo sapiens,,"VAMP-seq, drug sensitivity",NUD15_HUMAN_full_11-26-2021_b04.a2m,1,164,164,0.4,0.2,153922,0.72,118,43847.8,371.5915254,high,151,1.279661017,NUD15_HUMAN_Suiter_2020.csv,Final NUDT15 activity Score,1,mutant,NUD15_HUMAN_theta_0.2.npy,../results/large_40to50/NUD15_HUMAN_Suiter_2020/sft_best.pt
P53_HUMAN_Giacomelli_NULL_Etoposide_2018,P53_HUMAN_Giacomelli_NULL_Etoposide_2018.csv,P53_HUMAN,Human,MEEPQSDPSVEPPLSQETFSDLWKLLPENNVLSPLPSQAMDDLMLSPDDIEQWFTEDPGPDEAPRMPEAAPRVAPAPAAPTPAAPAPAPSWPLSSSVPSQKTYQGSYGFRLGFLHSGTAKSVTCTYSPALNKMFCQLAKTCPVQLWVDSTPPPGTRVRAMAIYKQSQHMTEVVRRCPHHERCSDSDGLAPPQHLIRVEGNLRVEYLDDRNTFRHSVVVPYEPPEVGSDCTTIHYNYMCNSSCMGGMNRRPILTIITLEDSSGNLLGRNSFEVRVCACPGRDRRTEEENLRKKGEPHHELPPGSTKRALPNNTSSSPQPKKKPLDGEYFTLQIRGRERFEMFRELNEALELKDAQAGKEPGGSRAHSSHLKSKKGQSTSRHKKLMFKTEGPDSD,393,False,7467,7467,0,-0.5,manual,Giacomelli,Mutational processes shape the landscape of TP53 mutations in human cancer,2018,10.1038/s41588-018-0204-y,1-393,TP53,Homo sapiens,"drug resistance (nutlin-3, etoposide)",Growth,P53_HUMAN_full_04-29-2022_b09.a2m,1,393,393,0.9,0.2,5069,0.858,337,153.2,0.4545994065,low,7,0.02077151335,P53_HUMAN_Giacomelli_2018.csv,A549_p53NULL_Etoposide_Z-score,1,Allele,P53_HUMAN_theta_0.2.npy,../results/large_40to50/P53_HUMAN_Giacomelli_NULL_Etoposide_2018/sft_best.pt
P53_HUMAN_Giacomelli_NULL_Nutlin_2018,P53_HUMAN_Giacomelli_NULL_Nutlin_2018.csv,P53_HUMAN,Human,MEEPQSDPSVEPPLSQETFSDLWKLLPENNVLSPLPSQAMDDLMLSPDDIEQWFTEDPGPDEAPRMPEAAPRVAPAPAAPTPAAPAPAPSWPLSSSVPSQKTYQGSYGFRLGFLHSGTAKSVTCTYSPALNKMFCQLAKTCPVQLWVDSTPPPGTRVRAMAIYKQSQHMTEVVRRCPHHERCSDSDGLAPPQHLIRVEGNLRVEYLDDRNTFRHSVVVPYEPPEVGSDCTTIHYNYMCNSSCMGGMNRRPILTIITLEDSSGNLLGRNSFEVRVCACPGRDRRTEEENLRKKGEPHHELPPGSTKRALPNNTSSSPQPKKKPLDGEYFTLQIRGRERFEMFRELNEALELKDAQAGKEPGGSRAHSSHLKSKKGQSTSRHKKLMFKTEGPDSD,393,False,7467,7467,0,0.04438920187,median,Giacomelli,Mutational processes shape the landscape of TP53 mutations in human cancer,2018,10.1038/s41588-018-0204-y,1-393,TP53,Homo sapiens,"drug resistance (nutlin-3, etoposide)",Growth,P53_HUMAN_full_04-29-2022_b09.a2m,1,393,393,0.9,0.2,5069,0.858,337,153.2,0.4545994065,low,7,0.02077151335,P53_HUMAN_Giacomelli_2018.csv,A549_p53NULL_Nutlin-3_Z-score,-1,Allele,P53_HUMAN_theta_0.2.npy,../results/large_40to50/P53_HUMAN_Giacomelli_NULL_Nutlin_2018/sft_best.pt
P53_HUMAN_Giacomelli_WT_Nutlin_2018,P53_HUMAN_Giacomelli_WT_Nutlin_2018.csv,P53_HUMAN,Human,MEEPQSDPSVEPPLSQETFSDLWKLLPENNVLSPLPSQAMDDLMLSPDDIEQWFTEDPGPDEAPRMPEAAPRVAPAPAAPTPAAPAPAPSWPLSSSVPSQKTYQGSYGFRLGFLHSGTAKSVTCTYSPALNKMFCQLAKTCPVQLWVDSTPPPGTRVRAMAIYKQSQHMTEVVRRCPHHERCSDSDGLAPPQHLIRVEGNLRVEYLDDRNTFRHSVVVPYEPPEVGSDCTTIHYNYMCNSSCMGGMNRRPILTIITLEDSSGNLLGRNSFEVRVCACPGRDRRTEEENLRKKGEPHHELPPGSTKRALPNNTSSSPQPKKKPLDGEYFTLQIRGRERFEMFRELNEALELKDAQAGKEPGGSRAHSSHLKSKKGQSTSRHKKLMFKTEGPDSD,393,False,7467,7467,0,-1.0,manual,Giacomelli,Mutational processes shape the landscape of TP53 mutations in human cancer,2018,10.1038/s41588-018-0204-y,1-393,TP53,Homo sapiens,"drug resistance (nutlin-3, etoposide)",Growth,P53_HUMAN_full_04-29-2022_b09.a2m,1,393,393,0.9,0.2,5069,0.858,337,153.2,0.4545994065,low,7,0.02077151335,P53_HUMAN_Giacomelli_2018.csv,A549_p53WT_Nutlin-3_Z-score,-1,Allele,P53_HUMAN_theta_0.2.npy,../results/large_50to60/P53_HUMAN_Giacomelli_WT_Nutlin_2018/sft_best.pt
Q59976_STRSQ_Romero_2015,Q59976_STRSQ_Romero_2015.csv,Q59976_STRSQ,Prokaryote,MVPAAQQTAMAPDAALTFPEGFLWGSATASYQIEGAAAEDGRTPSIWDTYARTPGRVRNGDTGDVATDHYHRWREDVALMAELGLGAYRFSLAWPRIQPTGRGPALQKGLDFYRRLADELLAKGIQPVATLYHWDLPQELENAGGWPERATAERFAEYAAIAADALGDRVKTWTTLNEPWCSAFLGYGSGVHAPGRTDPVAALRAAHHLNLGHGLAVQALRDRLPADAQCSVTLNIHHVRPLTDSDADADAVRRIDALANRVFTGPMLQGAYPEDLVKDTAGLTDWSFVRDGDLRLAHQKLDFLGVNYYSPTLVSEADGSGTHNSDGHGRSAHSPWPGADRVAFHQPPGETTAMGWAVDPSGLYELLRRLSSDFPALPLVITENGAAFHDYADPEGNVNDPERIAYVRDHLAAVHRAIKDGSDVRGYFLWSLLDNFEWAHGYSKRFGAVYVDYPTGTRIPKASARWYAEVARTGVLPTAGDPNSSSVDKLAAALEHHHHHH,501,False,2999,2999,0,-1.0,manual,Romero,Dissecting enzyme function with microfluidic-based deep mutational scanning,2015,10.1073/pnas.1422285112,1-501,β-glucosidase,Streptomyces sp.,Enzyme function,Activity,Q59976_STRSQ_full_11-26-2021_b03.a2m,1,501,501,0.3,0.2,105913,0.882,442,13981.2,31.63167421,medium,850,1.923076923,Q59976_STRSQ_Romero_2015.csv,enrichment,1,mutant,Q59976_STRSQ_theta_0.2.npy,../results/large_60to70/Q59976_STRSQ_Romero_2015/sft_best.pt
RASH_HUMAN_Bandaru_2017,RASH_HUMAN_Bandaru_2017.csv,RASH_HUMAN,Human,MTEYKLVVVGAGGVGKSALTIQLIQNHFVDEYDPTIEDSYRKQVVIDGETCLLDILDTAGQEEYSAMRDQYMRTGEGFLCVFAINNTKSFEDIHQYREQIKRVKDSDDVPMVLVGNKCDLAARTVESRQAQDLARSYGIPYIETSAKTRQGVEDAFYTLVREIRQHKLRKLNPPDESGPGCMSCKCVLS,189,False,3134,3134,0,-0.25,manual,Bandaru,Deconstruction of the Ras switching cycle through saturation mutagenesis,2017,10.7554/eLife.27810,1-161,HRAS,Homo sapiens,C-Raf binding and GEF,activity,RASH_HUMAN_full_11-26-2021_b03.a2m,1,189,189,0.3,0.2,204751,0.862,163,23971.6,147.0650307,high,205,1.257668712,RASH_HUMAN_Bandaru_2017.csv,unregulated,1,mutant,RASH_HUMAN_theta_0.2.npy,../results/large_60to70/RASH_HUMAN_Bandaru_2017/sft_best.pt
REV_HV1H2_Fernandes_2016,REV_HV1H2_Fernandes_2016.csv,REV_HV1H2,Virus,MAGRSGDSDEELIRTVRLIKLLYQSNPPPNPEGTRQARRNRRRRWRERQRQIHSISERILSTYLGRSAEPVPLQLPPLERLTLDCNEDCGTSGTQGVGSPQILVESPTVLESGTKE,116,False,2147,2147,0,-0.06744744968,median,Fernandes,Functional Segregation of Overlapping Genes in HIV,2016,10.1016/j.cell.2016.11.031,1-116,rev,Human immunodeficiency virus type 1 group M subtype B (isolate BRU/LAI) (HIV-1),Viral replication,Growth,REV_HV1H2_full_theta0.99_04-29-2022_b09.a2m,1,116,116,0.9,0.01,15839,0.948,110,9951.8,90.47090909,medium,54,0.4909090909,REV_HV1H2_Fernandes_2016.csv,sel_coeff_mean,1,mutant,REV_HV1H2_theta_0.01.npy,../results/large_60to70/REV_HV1H2_Fernandes_2016/sft_best.pt
TPK1_HUMAN_Weile_2017,TPK1_HUMAN_Weile_2017.csv,TPK1_HUMAN,Human,MEHAFTPLEPLLSTGNLKYCLVILNQPLDNYFRHLWNKALLRACADGGANRLYDITEGERESFLPEFINGDFDSIRPEVREYYATKGCELISTPDQDHTDFTKCLKMLQKKIEEKDLKVDVIVTLGGLAGRFDQIMASVNTLFQATHITPFPIIIIQEESLIYLLQPGKHRLHVDTGMEGDWCGLIPVGQPCMQVTTTGLKWNLTNDVLAFGTLVSTSNTYDGSGVVTVETDHPLLWTMAIKS,243,False,3181,3181,0,0.5,manual,Weile,A framework for exhaustively mapping functional missense variants,2017,10.15252/msb.20177908,1-243,Thiamin pyrophosphokinase 1,Homo sapiens,Yeast growth,complementation,TPK1_HUMAN_full_11-26-2021_b02.a2m,1,243,243,0.2,0.2,21515,0.823,200,7122.6,35.613,medium,234,1.17,TPK1_HUMAN_Weile_2017.csv,screenscore,1,mutant,TPK1_HUMAN_theta_0.2.npy,../results/large_70to80/TPK1_HUMAN_Weile_2017/sft_best.pt
VKOR1_HUMAN_Chiasson_abundance_2020,VKOR1_HUMAN_Chiasson_abundance_2020.csv,VKOR1_HUMAN,Human,MGSTWGSPGWVRLALCLTGLVLSLYALHVKAARARDRDYRALCDVGTAISCSRVFSSRWGRGFGLVEHVLGQDSILNQSNSIFGCIFYTLQLLLGCLRTRWASVLMLLSSLVSLAGSVYLAWILFFVLYDFCIVCITTYAINVSLMWLSFRKVQEPQGKAKRH,163,False,2695,2695,0,0.7480893367,median,Chiasson,"Multiplexed measurement of variant abundance and activity reveals VKOR topology, active site and human variant impact",2020,10.7554/eLife.58026,2-163,VKORC1,Homo sapiens,protein stability (eGFP fusion reporter),,VKOR1_HUMAN_full_11-26-2021_b03.a2m,1,163,163,0.3,0.2,14510,0.779,127,4655.0,36.65354331,medium,97,0.7637795276,VKOR1_HUMAN_Chiasson_2020.csv,abundance_score,1,variant,VKOR1_HUMAN_theta_0.2.npy,../results/large_80to87/VKOR1_HUMAN_Chiasson_abundance_2020/sft_best.pt
