Gonorrhea Augmented Dataset
Predicting Antibiotic Resistance Genes
@kaggle.salmaneunus_gonohhrea_augmented_dataset
Predicting Antibiotic Resistance Genes
@kaggle.salmaneunus_gonohhrea_augmented_dataset
This dataset has been preprocessed for ML training. First, the class imbalance problem was addressed by applying CTGAN. Then feature selection techniques and PCA were applied for dimensionality reduction. The features are unitigs, which are short strands of DNA, and the dataset records whether each unitig is present or absent in each sample. The presence or absence of thousands of unitigs indicates whether the sample will be resistant or susceptible to the antibiotic.
-- Training feature table for the "azm" target (x_train_augmented_azm).
-- "unnamed_0" holds the source file's unnamed first column; every other column
-- is a BIGINT named after a lowercased unitig (DNA) sequence.
-- Names ending in an 8-hex-digit suffix are shortened forms of longer headers;
-- the trailing comment on those lines preserves the full original header.
-- NOTE(review): values are presumably presence/absence indicators -- confirm.
-- The separating comma precedes each trailing `--` comment, because everything
-- after `--` is ignored by the parser.
CREATE TABLE x_train_augmented_azm (
    "unnamed_0" VARCHAR, -- Unnamed: 0
    "cttaacatatttgcctttgatttttgaagaagctgccacgccggcag" BIGINT,
    "taccgtaaccggcaatgcggatattacggtc" BIGINT,
    "cagacggcattttttttgcgtttttcgggagg" BIGINT,
    "aacgggttttcagacggcattcgatatcgggacg" BIGINT,
    "ccaaaaattacccgcgttgacgtagctaaaga" BIGINT,
    "cggaccggtattccgtcgaaatcaccgccgtcaaccgcccc" BIGINT,
    "tgaaattgtccatctcgtatgccgtcttctgcttg" BIGINT,
    "tacggtattgtccgcattattaaactcaaaacc_agaagacggcatacgagatg_42cccb6f" BIGINT, -- TACGGTATTGTCCGCATTATTAAACTCAAAACC,AGAAGACGGCATACGAGATGGACAATTTCATCC
    "ggcattttttttgcgtttttcgggagggggcggc" BIGINT,
    "tatataaggggttgccgttccgcagttgggcggcagcatac" BIGINT,
    "tggtaatgccgggtgagaacgtaaccattactgtagaactgattgcg" BIGINT,
    "acgctttgaacatatttgcctttgatttcgg" BIGINT,
    "ttatgaacaaaccattggtgaatcaggctgctatggt" BIGINT,
    "acggcgacggcagcggcgacggcgacggcaacggca" BIGINT,
    "cgcatgggcaagcaggtcgagatattcgccg" BIGINT,
    "cctggcaaacgcttccccgtcgccctcgaaca" BIGINT,
    "gtctgatttcacaagtcttgtgaagtcttacctgccttaccgtccaacatccgccgcagcc" BIGINT,
    "agcttggatatgtccaatcctacagtgttacg" BIGINT,
    "ccactatgctgacacccgaacaagtcaaggcc" BIGINT,
    "tgccgtcttctgcttgaaaaaaaaaaagcac" BIGINT,
    "ataaagatgagataacggctttgattaatagtcttaaataaaggggc" BIGINT,
    "cagtttgaagtagcgcgcggcggcaacggcgtaaatcagtgcctg" BIGINT,
    "gaagatgcaatctacccgctgctagacggaaagaccc" BIGINT,
    "aacggcacattccacgccgtttcttctctcg" BIGINT,
    "gtcgtaatcaccgccctgccgaccgccatggcctcctggg" BIGINT,
    "aaggctttcatcattcgcttctcggtcgctgcgcatacccg" BIGINT,
    "caaacaaactggggatattatatgcatatcct" BIGINT,
    "taccggtttaaatttaattcactatacatcccgt" BIGINT,
    "accgtaatatccgcattgccggttacggtat" BIGINT,
    "aaaatggaaagatatgcatataatatccccg" BIGINT,
    "ctgcccttggctttggcgcgttatttgccgcacaagcggctcaaagc" BIGINT,
    "gtgaagggtcggcaggtttgaccgtaatatccgc" BIGINT,
    "acacaaccgccttccggccatgccggcggggaaacaaggcgcaaacacgcggggcgggacg" BIGINT,
    "gaaaccctcctgaccgacaaccgcatctggaaacag" BIGINT,
    "acgccgacgacgccgtcaaagacgacgccga" BIGINT,
    "gacgcagcagctacggtttatcctgacggatatccgc" BIGINT,
    "aaatgtcagcttggatatgtccaatcctacagt" BIGINT,
    "actatgctgacacccgaacaagtcaaggccc" BIGINT,
    "aatatccgcattgccggttacggtattgtcc" BIGINT,
    "aaatacgcaaagcacctatcgcgaaagcgacagcatccg" BIGINT,
    "atgcatataatatccccagtttgtttgttga" BIGINT,
    "aatgccctctccccggcccgccattgccgcgcaggcg" BIGINT,
    "tcttctgtcgtatagacgaggttttgattac" BIGINT,
    "tggaaagaaagaataataaaactcctggcgtcgaccagcttaacataaaatacc" BIGINT,
    "tcccgaaaaacgcaaaaaaaatgccgtctgaagacctttcggac" BIGINT,
    "aaaccggtacggcgttgcctcgccttttcgtactat" BIGINT,
    "aaaacctcgtctatacgacagaagaccaccgtattt" BIGINT,
    "aagccgagagaagaaacggcgtggaatgtgcc" BIGINT,
    "gcccgtcccgatatcgaatgccgtctgaaaacc" BIGINT,
    "cccgcgataaatgctatttcagtcaatcgtac" BIGINT,
    "gattatccggagcgaccgtaacgaaccaaacaaaaacc" BIGINT,
    "ccgcctgcgcggcaatggcgggccggggaga" BIGINT,
    "atggtaatgccgggtgagaacgtaaccatta_aagcagttgttttaacaggaca_069e0b31" BIGINT, -- ATGGTAATGCCGGGTGAGAACGTAACCATTA,AAGCAGTTGTTTTAACAGGACAATCTGGTCGGGG
    "ccaaaagacggaaaatcaggaaaacggcagcttc" BIGINT,
    "tgatgaaagccgggccatggcattctccgaaatccaaaaa" BIGINT,
    "cggataatcagccctttcgggcgcgaatgctgtgaag" BIGINT,
    "gcaacttggagaatgccctctccccggcccgcc" BIGINT,
    "ggagaatgccctctccccggcccgccattgccgc" BIGINT,
    "caatgcggatattacggtcaaacctgccgaccct" BIGINT,
    "ccttttgatgaagtcgggaaatgcccttatc" BIGINT,
    "gcgccaaaatttccgatgtgctgcccgccgccg" BIGINT,
    "cactataccggccggatgaaattgtccatctcgtatgccgtct" BIGINT,
    "ttacgcgcgccgacaacgccgacaacgacgacgt" BIGINT,
    "cgcgccaaaatttccgatgtgctgcccgccg" BIGINT,
    "tatgccgtcttctgcttgaaaaaaaaaaagca" BIGINT,
    "cggatgtatcagaaaggagaataaattgcaacctttagtcagcgt" BIGINT,
    "taacactgtaggattggacatatccaagctgac" BIGINT,
    "atatccgcattgccggttacggtattgtccg" BIGINT,
    "aacggcgtggaatgtgccgttttcctgatgt" BIGINT,
    "aagcaaaacccccgccaaacgccaatctgcccgggggtttcgagatacaacatgagccaat" BIGINT,
    "cgaaaaggcgaggcaacgccgtaccggtttaaat" BIGINT,
    "ccccccccccatcaaatgaatggcagattga" BIGINT,
    "gtcgagatattcgccgcgcaacggcgagaatacgccgaaag" BIGINT,
    "ggtgaacttgcagtttttcaacaaacaaaccggggatattat" BIGINT,
    "gcgcgacaacgccaaagacgccgacgacgccgtcaaagac" BIGINT,
    "acccgccaacccgaccgccgtgattcccgcg" BIGINT,
    "acccccatcgatccgtccagcctgaagcagcagtcggcagg" BIGINT,
    "agggcggcaaaggcgggctttcgtcccccacg" BIGINT,
    "cggcgtcgtctttgacggcgtcgtcggcgtc" BIGINT,
    "tttggggcatgtgtaaatccgtgcttgtgggtaattttaacgctcgacgataatcttcccg" BIGINT,
    "atatccccagtttgtttgttgaaaaactgca" BIGINT,
    "atattccgtgaacataaaagagttgaaaaaaaagaataataaaacttctggcggcg" BIGINT,
    "acaaactggggatattatatgcatatccttc_agcgaatgatgaaagccttaac_6ae905c7" BIGINT, -- ACAAACTGGGGATATTATATGCATATCCTTC,AGCGAATGATGAAAGCCTTAACGCCCTTGGGCGAAAGG,CGAATGCCGTCTGAAAACCCGTTGACGGCGC
    "tatatattgcgtaacactgtaggattggacatatc" BIGINT,
    "tccgtcgaaattaccgccgtcaaccgccccttcctgctcgcc_acactataccg_787d6ca3" BIGINT, -- TCCGTCGAAATTACCGCCGTCAACCGCCCCTTCCTGCTCGCC,ACACTATACCGGCCGGATGAAATTGTCCATC
    "gcgcgtcaagccaaagccggtcgcattatcaccattgataccaatcctgcaaaa_40657557" BIGINT, -- GCGCGTCAAGCCAAAGCCGGTCGCATTATCACCATTGATACCAATCCTGCAAAATTCGAGT,TATCGGATGCCGTCTGAAGCGGAAATGTGAA,AACGTAACCATTACTGTAGAACTGATTGCGCCTATCGCTATGG
    "gcccagtcgagaacagcaaagcaacgcgggcatgcgtagcgaccgagaagcgaatg" BIGINT,
    "tacggcgaaggcactaaaatggaaagatatgcatataat" BIGINT,
    "aagaaacggcgtggaatgtgccgttttcctga" BIGINT,
    "attaatagtcttaaataaaggggctgtaccggat" BIGINT,
    "taattaaaaacaacatggtaatcaataatgacgatgaacccaccacccaatactacagcc" BIGINT,
    "catggcattctccgaaatccaaaaacggaaa_gcatcgtaccatcccgacagga_e6b61f49" BIGINT, -- CATGGCATTCTCCGAAATCCAAAAACGGAAA,GCATCGTACCATCCCGACAGGAAACATCATACACATACTGACCGCCGGCGTGGACGAGGCA,AGGTTCTAGATTCCCGTTTTCACGGCAATGACG
    "gtctgaaaacccgttgacggcgcatgggcaagcagg" BIGINT,
    "caataccgtaaccggcaatgcggatattacg" BIGINT,
    "caactgcggaacggcaaccccttatatattgcgtaa" BIGINT,
    "atataatatccccagtttgtttgttgaaaaa_gcactaaaatggaaagatatgc_13c7ce18" BIGINT, -- ATATAATATCCCCAGTTTGTTTGTTGAAAAA,GCACTAAAATGGAAAGATATGCATATAATATCCCC,ATTGCCGGTTACGGTATTGTCCGCATTATTAAA,ATTTGACCCGCCAACCCGACCGCCGTGATTCCCG,GCAATTTTTCGTCATTGCCGTGAAAACGGGAATCTA
    "cgccgacgacgccgtcaaagacgacgccgac" BIGINT,
    "atctcgtatgccgtcttctgcttgaaaaaaa" BIGINT,
    "caacaaaataccatccttttcgaactgaccggaaccggttgcggcgtcgcaaaa_89083650" BIGINT -- CAACAAAATACCATCCTTTTCGAACTGACCGGAACCGGTTGCGGCGTCGCAAAAGAAGGCTGGGAATC
);
-- Training feature table for the "cip" target (x_train_augmented_cip).
-- "unnamed_0" holds the source file's unnamed first column; every other column
-- is a BIGINT named after a lowercased unitig (DNA) sequence.
-- Names ending in an 8-hex-digit suffix are shortened forms of longer headers;
-- the trailing comment on those lines preserves the full original header.
-- NOTE(review): values are presumably presence/absence indicators -- confirm.
-- The separating comma precedes each trailing `--` comment, because everything
-- after `--` is ignored by the parser.
CREATE TABLE x_train_augmented_cip (
    "unnamed_0" VARCHAR, -- Unnamed: 0
    "acgtttatgccgttatcgatccgatagccggt" BIGINT,
    "catctgcaccctgtcggcactcgccgcctgaaccaccccgtccggacaagg" BIGINT,
    "cacaaaactcgtttcctgctccgaaatgggcga_gtaagggctttcttaaattt_c62900b4" BIGINT, -- CACAAAACTCGTTTCCTGCTCCGAAATGGGCGA,GTAAGGGCTTTCTTAAATTTGATTAAAGGTCGTCTGAA,AACCGAAACCGACCGCGCCGTCGAATATCAGGCGGTCGCACCGGAAGTACG
    "aaatcttccgctttaatccatttgccgtccga" BIGINT,
    "aaacctgccgcagccggcgcatctttgggcggcggtctggac_aacgtggtgta_c280dd17" BIGINT, -- AAACCTGCCGCAGCCGGCGCATCTTTGGGCGGCGGTCTGGAC,AACGTGGTGTACCAAACCCGCCGTTTCGACCGTTATAAAGAA
    "cccaacacactcgacgtatggatgagccacggc" BIGINT,
    "ttttcaacaaaaaactgcttgtccaacggcaaa" BIGINT,
    "tttcaaccggatagctgaaaaaacaaaaaagttcgata" BIGINT,
    "catcacttcccgctgccgtttttttgtttcagacggcat" BIGINT,
    "aaactgcttgtccaacggcaaaccggcgggcagg_cacatagaaaagcggaaca_023610f0" BIGINT, -- AAACTGCTTGTCCAACGGCAAACCGGCGGGCAGG,CACATAGAAAAGCGGAACAAGGAACACGGATAAAAGCGT,TTTCCTCCGACCATACAGAAGATACCATACGCCTCTCCAAACGTATGG,AGAAAGTGGAATTGAGGAAACCTTTTTATCCGATGAG,TGGATATAGTCTTTTAATTCGTCTTTCGTCGCCCAAGCAGTGCCATAA
    "caggcaccgattaacggcaacgatccctatgctaatg" BIGINT,
    "aagaaaccgttttacccgataagtttctgtgccgaca" BIGINT,
    "agccttgccgtaaatgccttcaagacatgcgg" BIGINT,
    "cgaccaaaacgtgcagggctacattaaaaacctgccgctgcggcata_cggcaa_871cc413" BIGINT, -- CGACCAAAACGTGCAGGGCTACATTAAAAACCTGCCGCTGCGGCATA,CGGCAACGTTGAAGACGGCTTCGACGGTTTCGGCG
    "acgattcggatggtttcgagataaaaccgtc" BIGINT,
    "aatgtcaaactggcagaccaacgccacccgaagacaggcgtaccgtttg" BIGINT,
    "aaaaatcatagccgtcatcgggcaactcgtc" BIGINT,
    "aaagacccgtctttgaccaaagaagaactcaccgctttctgccgtac_aaccaa_b98a13d5" BIGINT, -- AAAGACCCGTCTTTGACCAAAGAAGAACTCACCGCTTTCTGCCGTAC,AACCAATAAAAACCATATGCCCGAAAACAGCATCATTGCCGAATATTTCATTCGTTCGGCA
    "caccggcatctgcccccactgcatcaacccgcct" BIGINT,
    "accaaacaactgaccggttgaaaactgccgaaatgccgtctgaaacgtttcaga_a9eacf56" BIGINT, -- ACCAAACAACTGACCGGTTGAAAACTGCCGAAATGCCGTCTGAAACGTTTCAGACGGCAT,AACCGCGCCCACGCCTACAAAGCCGCCGTTCAAGCCAATGCGGAAAACGGGCAGGAAGA,GCCCGACAGCCCGACCCAGCGCGTCGGCGGCGAGCCTTTG,GCAGGCTTTCTTCAAACCGATGGCGTGTGCGGCATTTCTGTCCGCCGTTTCGC,CCGAACACGCCGGCAGCGTGTGGATGATGGTGCAG,AATAAAAAGGCCGTCTGAAACATATCCTTTTCAG
    "aattggtcggacgttatcattcgggttgttatgtatc" BIGINT,
    "caccctacccctgtaaacatcacgatttgccgg" BIGINT,
    "gtgccggaacagcccgccctgccaaacaaatgccgtctgaaaccggaaaa_gaa_5291ef67" BIGINT, -- GTGCCGGAACAGCCCGCCCTGCCAAACAAATGCCGTCTGAAACCGGAAAA,GAAGAAGCGGAAGGCGACGTACTCAAACGTGCCCAAGCA,AACTGGTCGAGATTGATGCCGTTCGCATCCGCCA
    "aaaaaaatcctaaagggcgagctgattaaaa" BIGINT,
    "actacatcggtttcctcgccgatggagcggaca" BIGINT,
    "ccatcacggaaaaacccgtaccgttgtagtccgacatttc" BIGINT,
    "cgaaagcaggctttcggcatagacggacgacagccgttcgtcaacccaat_ctg_63ccf7c1" BIGINT, -- CGAAAGCAGGCTTTCGGCATAGACGGACGACAGCCGTTCGTCAACCCAAT,CTGTTTTTCGGCAATCATCACCACATCGATGCTCGAACAGCCCGCCAC,CGGACACAACGGGCGCGGAAGATAAAGCTGAAATTGTCGGAA
    "cctttcaaaccgtgcatcagcccgaggctgtggcggac_acatacaaaacgccg_ec082207" BIGINT, -- CCTTTCAAACCGTGCATCAGCCCGAGGCTGTGGCGGAC,ACATACAAAACGCCGCCCTCCGCCTTCTGCAACA,CATCCGCGTGAACCATCCTTTGACCTTGCACGGC
    "gatatattgggaaacgaacggaatcagaatctgcc" BIGINT,
    "cgtctgaagtgatttcgcgccccagccagtc_gtaatcgatgaagaaggcttcg_5f670041" BIGINT, -- CGTCTGAAGTGATTTCGCGCCCCAGCCAGTC,GTAATCGATGAAGAAGGCTTCGCGTTTGCGGGTG
    "aaccggtgagaaactcgagcgcaccatccgcgtgaaccatcctttgaccttg" BIGINT,
    "acgggggagggagcagattgcggcagatttgg" BIGINT,
    "cagcaaaccgttccgcttcaacgcgcgtacttgggaat" BIGINT,
    "cggcgcagggttgagctacgcgggtaaagccgcagg" BIGINT,
    "atattgtagtgttcgccataacagacctgaaaatcatc" BIGINT,
    "aaaataaaatcacaattatgcgaataaagtttgtataaatttctcctaac" BIGINT,
    "ggttgaaaacacaaaacaggatcaggacgacaacgcggacga" BIGINT,
    "gaaacaggtggacggcacggcggtcaattaccgg_gatttggacaatgacgcgc_4b38204a" BIGINT, -- GAAACAGGTGGACGGCACGGCGGTCAATTACCGG,GATTTGGACAATGACGCGCTGCTGCGTGCCATCGCCG,AAAGTGGTTCACGTCGGCTTTGCCGTTGGGATACAC,ACCATCAAACCTACATCACCAACCTGAACAATCAA
    "acaagacgacaggcggcggaacacgtcgtcg_cgggcagccgaaggtatggccg_e2b627ff" BIGINT, -- ACAAGACGACAGGCGGCGGAACACGTCGTCG,CGGGCAGCCGAAGGTATGGCCGCAGTCGCCGCAAAACAGCGCAGGCGC
    "gctccaatcgcgataccggtaaagatgtacgcc" BIGINT,
    "gacacctgcgccgtggtcacctacgcaatgcggcgtgttcactaaaatatcgacttctttg" BIGINT,
    "cccatgtgctgcggttgtccagtttggacggcag" BIGINT,
    "ttcgacttcgcgctcacggggcagaccatgcgccacgaccaccg_tgctgtccg_9d08c234" BIGINT, -- TTCGACTTCGCGCTCACGGGGCAGACCATGCGCCACGACCACCG,TGCTGTCCGAAATGGAAAGCGGTTTAAGCCCC
    "aattacccgttccgggcaaaatttccgttaccccgaccaaatctctggc_agga_ed92c3e3" BIGINT, -- AATTACCCGTTCCGGGCAAAATTTCCGTTACCCCGACCAAATCTCTGGC,AGGATCAACTTGTTGAGCTTCCAAAACCAACACGTTTGGCAAGTTGCGTGAAGCCAAGTAA,GCGCGCAAAAACGAAGGTTATTGGATTACCATTTTCCCC,CGCACCATAAACTTCAATGCCGCCGGCCGGATAGGCACCATGATAAAGCTGT
    "ttgcttggtgatttgttcgataacctgctcatcgccgtgggtaacgatggtcatccgtgac" BIGINT,
    "gcctttgcgtccgttgtttttcgtcagggcgg" BIGINT,
    "aaacagttgtacgctttcacccacgggcggcaggttgtagaaggt" BIGINT,
    "taccgccccggacggatccgaagcggcgggcggt" BIGINT,
    "aactttagcaaaactttctgccgaaaaaggctgg_caggacgataaacaaaatg_987c3ef6" BIGINT, -- AACTTTAGCAAAACTTTCTGCCGAAAAAGGCTGG,CAGGACGATAAACAAAATGCTGCCGGCGAGGAATATTTCGTTCGATCCGATGATG
    "caaacatcaccacaatggagttcaagggcgat" BIGINT,
    "aaccgccgcaggattgcctcaaccctatctgtcccgcatcgaaaa" BIGINT,
    "tgaaattaaacgaaaaacaccgctatgccgtgat" BIGINT,
    "acaaaacggcgcagtgccgcgcaaagccaaaatattcgccatcagtatgatgac_36a587b0" BIGINT, -- ACAAAACGGCGCAGTGCCGCGCAAAGCCAAAATATTCGCCATCAGTATGATGACCGCATCCTGCCTGATAATGTTTTGGCAGTTTCCCCAACGCTGGTGG
    "gggataccgtatcagtatgggttgggggaatcagg" BIGINT,
    "caaccgccctgccgtcgttgaagcggataaagccgg" BIGINT,
    "tatgacgcaagaacgtttacccgaatttttcgacc_ggatttcgtgtgccagcc_660e0ec5" BIGINT, -- TATGACGCAAGAACGTTTACCCGAATTTTTCGACC,GGATTTCGTGTGCCAGCCGCTTCGCCACTTCACCCCA,ATAAAGTAACGCAGGTTTTAATTGCTGTCCCAAAATGTCCGATAG
    "ttatgcgacgcgccgaaagtatgcgtgacggactg_aggcacgaggctgccgat_e1c0fdc8" BIGINT, -- TTATGCGACGCGCCGAAAGTATGCGTGACGGACTG,AGGCACGAGGCTGCCGATACGATCCCGAAACC
    "caaagccgcaacctcgccatatgcccgttcaaacgtaccgatataa" BIGINT,
    "ggtttgttcgggaacgcgcgaccacctttacgccacagcggagaagaagtcata_3d468fe4" BIGINT, -- GGTTTGTTCGGGAACGCGCGACCACCTTTACGCCACAGCGGAGAAGAAGTCATA,TCCAAAAACGGAGGGATACCGGGCAGCATCCCGACCGCACCCATCGCC,AGTGCTGGAAGTCGATGCCGCACGCAAACGC,GAACCGCCCGCCGCTTCGGATCCGTCCGGGGC
    "ctgaaagaaggctgtcccaacaaatccgccggatcggtcttg" BIGINT,
    "gaaaaaaaagaaaagaaaaaggaaaaggcggaagcca" BIGINT,
    "tggaaatattcaaatttcctccaataatattaacga" BIGINT,
    "cggatgtcggcaatatcggtgcatttttgccgacgtggccgctgtttgcc_aaa_9620f718" BIGINT, -- CGGATGTCGGCAATATCGGTGCATTTTTGCCGACGTGGCCGCTGTTTGCC,AAACAACAGACAAATCAAACTGATTGCCGCCTCC
    "gaacaataacattgtcagcttggcgaagcaggc" BIGINT,
    "taaaaagggcactcatggagctgaccgtccact" BIGINT,
    "gcaagtactgccgcaccgacgaaaaacgggcgcatagggtgggtaa" BIGINT,
    "gccacgctttgcagcacgttttcaaatttcagaagctcggcggcaagc" BIGINT,
    "acgccgcacaaaaaagcggcaataggcaggcaatcagaatgcaccaa" BIGINT,
    "ttctcgccctcggaagtcagcttcagataaacgcgccgt" BIGINT,
    "ttttggattggggaaaaatgcatgaggtggaaattaccgaaaccgatcctttaacgggggaaa" BIGINT,
    "gcggtggaaaccttgtgcgaaggcagccccgaa_agcttggcgccggcgatgct_b95a35f4" BIGINT, -- GCGGTGGAAACCTTGTGCGAAGGCAGCCCCGAA,AGCTTGGCGCCGGCGATGCTTGCCTTTAAAGGGCGCAA
    "gcggaatccactcgtggaactcggtaaattgatagccgccgctcaaacggtcgaaaccg" BIGINT,
    "gcagcaccatttcttttgcagccgccgccgcgtggaacag_ttttattttcttt_770e5101" BIGINT, -- GCAGCACCATTTCTTTTGCAGCCGCCGCCGCGTGGAACAG,TTTTATTTTCTTTACATTATTGATATTGCCGTTCCATTTCCTGCGAAC
    "aacttcagattctacttttgctgcggtttcctgaacttggg_caaatcctgtgc_99d2be32" BIGINT, -- AACTTCAGATTCTACTTTTGCTGCGGTTTCCTGAACTTGGG,CAAATCCTGTGCCGCCGCCGCAAAAACAATCCGCTT
    "aatttccgttaccccgaccaaatctctggcgaccgac" BIGINT,
    "gaaaaagaacagacaggctgccaaagccccgaaggaaaatcaaaa" BIGINT,
    "gatgaggacaggttgaaacagtttctcgaacggtaaaaaa" BIGINT,
    "caatatccgatttatttccaacatcacggagagccgtatgaaa" BIGINT,
    "ggcagattccccatttgggttcggaacgcgcgcacgc" BIGINT,
    "caaactgcacgcgccgcccgtccgacctcggcatatccg_acgtgcctgccccg_fe23213c" BIGINT, -- CAAACTGCACGCGCCGCCCGTCCGACCTCGGCATATCCG,ACGTGCCTGCCCCGGATTTGTTCCGCATCGGGCAT
    "gatagccttaatttcaaaaggacgattaatggatacacaaa" BIGINT,
    "ctggcgaatgggtactggtacaaaatcagggtcgc" BIGINT,
    "cacaggaacagaccgcctcgggcgcatcctac" BIGINT,
    "agatcgggcgaatgtgctgccaaacccgccgcc" BIGINT,
    "gaacccttcagcgtgatggacttcatccaagccaatccgcgccat_tgcagttc_c61b0941" BIGINT, -- GAACCCTTCAGCGTGATGGACTTCATCCAAGCCAATCCGCGCCAT,TGCAGTTCGGTGGTGGCTTTGTAAAGCAGGAAAATACCGCCC
    "tacgtgaagaacaaaaagccgcgcagtaggcccgtttgaaaaatgccgtctg" BIGINT,
    "gttcaaggtgttaatcctaacactgaagaagccgacagccgtcaagccag" BIGINT,
    "aatgcgttgtcttgggctacctctggcggcgctggttttaaaggttctcgtaaa_f6ecaa2e" BIGINT, -- AATGCGTTGTCTTGGGCTACCTCTGGCGGCGCTGGTTTTAAAGGTTCTCGTAAAAGTACAC,CGTAGTGGACTACAACGTCAAAGTCCGTGTGAAAGCCGATGGTTCGGATGTG,GCTCGCGGATAAGGTTCTCAGGTTTCGCTTCACC,CAGCTCATACCGAACCGAAACCGTGCGCGGCGAAGATTTAAACGCCGTACGCATCATCGGA,TTCGCGTTGTTTTACAACGGAATAATGCGTCGAGCCTGAGTCGAA,ATCGACTACGGCACTTACCCCTTCGTTACCTCGTCCAAC
    "aaatatactaggtatggtactgttttgttagcaattcttcaa" BIGINT,
    "tgtgccacgatattctggggcagaccgcgctggtggatttggca" BIGINT,
    "acatacgggccgcgcccatggtcttcacccg" BIGINT,
    "tatggtcgaagaacacctgccgctcatcacgcagcag" BIGINT,
    "accaaccggtatcgatttaaccgatttccttaatatt_cacactcaaggacaac_6ca228b5" BIGINT, -- ACCAACCGGTATCGATTTAACCGATTTCCTTAATATT,CACACTCAAGGACAACAACATGGCAGCCTCGCCCGAAGCAAAATTCACCGAAGAAA,GTGGGATAATTGTTTTTAACTGTTCTTTTTAAAACTTGACATCATGGCGTGATGCCAACAA
    "cgaggctgataaattcataatgagccttacgcgcctcgcggtaaagctgctgca_e67b057e" BIGINT, -- CGAGGCTGATAAATTCATAATGAGCCTTACGCGCCTCGCGGTAAAGCTGCTGCAAAATC,AAAGTTTCCGAACGCCTTTGCACACGGTTTCCACGTCA
    "ggcagcatcagcaggcgcagcaccaaagcccgccccgg" BIGINT,
    "tccgccgtgtccaaacccaaagccagcccggcattgttgatgag" BIGINT,
    "taaccctgttttattttcccattctcgttgcg_acaaaaaaccgctttgtgtaa_1e6267b3" BIGINT, -- TAACCCTGTTTTATTTTCCCATTCTCGTTGCG,ACAAAAAACCGCTTTGTGTAAGGCGGTTGCAAAAAAA,ATCCCCTTTCGGGTATCCGGATTTTCCGTTG
    "gttaccgcgcccaaaatggtggaggggtcgcaaccgagtacgacggcgacgggatacggcg" BIGINT,
    "gatttgcgcggcagatgcaaaaccataggcgcgctgaccg" BIGINT
);
-- Test-set label table for the "azm" target: one row per sample, with the
-- sample identifier and the "azm_sr" value stored as DOUBLE.
-- NOTE(review): "azm_sr" is presumably the susceptible/resistant label -- confirm encoding.
-- The separating comma precedes the trailing `--` comment, because everything
-- after `--` is ignored by the parser.
CREATE TABLE y_test_augmented_azm (
    "unnamed_0" BIGINT, -- Unnamed: 0
    "sample_id" VARCHAR,
    "azm_sr" DOUBLE
);
-- Test-set label table for the "cip" target: one row per sample, with the
-- sample identifier and the "cip_sr" value stored as DOUBLE.
-- NOTE(review): "cip_sr" is presumably the susceptible/resistant label -- confirm encoding.
-- The separating comma precedes the trailing `--` comment, because everything
-- after `--` is ignored by the parser.
CREATE TABLE y_test_augmented_cip (
    "unnamed_0" BIGINT, -- Unnamed: 0
    "sample_id" VARCHAR,
    "cip_sr" DOUBLE
);
Anyone who has the link will be able to view this.