Skip to content

Commit 7cef793

Browse files
kl-metapool beta.zip (#141)
* kl-metapool beta.zip
* 100 -> 90
* illumina/good_sheet1.csv 100 -> 90
* good-sample-sheet_w_context.csv
* good_sheet_w_replicates.csv
* good_sheet1.csv
* duplicate_sample-sample-sheet.csv
* metatranscriptomic
* 100->0
* fix errors
* fix TestPipeline.test_generate_sample_information_files_multiple_preps_w_context
* kl-metapool main
* scipy
* sklearn
* sklearn -> scikit-learn
* rm changes to conda install
* Remove contains_replicates column in bioinformatics table
* Change sheet type to standard_metat for metatv0
* Put back sheet type as standard_metag
* add Library Well

---------

Co-authored-by: Amanda Birmingham <[email protected]>
1 parent 6e92d3f commit 7cef793

18 files changed

+50
-867
lines changed

src/qp_klp/StandardMetagenomicWorkflow.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -221,6 +221,7 @@ def __init__(self, **kwargs):
221221
'Project Plate': '',
222222
'Project Name': project_name,
223223
'Well': '',
224+
'Library Well': '',
224225
'# Reads': f'{_d.reads.sum()}',
225226
'Lane': '1'}
226227
data.append(sample)

tests/data/bad-sample-sheet-bool-test.csv

Lines changed: 0 additions & 816 deletions
This file was deleted.

tests/data/bad-sample-sheet-metagenomics.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
[Header],,,,,,,,,,,
22
IEMFileVersion,4,,,,,,,,,,
33
SheetType,standard_metag,,,,,,,,,,
4-
SheetVersion,100,,,,,,,,,,
4+
SheetVersion,90,,,,,,,,,,
55
Investigator Name,Knight,,,,,,,,,,
66
Experiment Name,RKL0042,,,,,,,,,,
77
Date,2020-02-26,,,,,,,,,,
@@ -19,7 +19,7 @@ Chemistry,Default,,,,,,,,,,
1919
ReverseComplement,0,,,,,,,,,,
2020
,,,,,,,,,,,
2121
[Data],,,,,,,,,,,
22-
Lane,Sample_ID,Sample_Name,Sample_Plate,well_id_384,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
22+
Lane,Sample_ID,Sample_Name,Sample_Plate,Sample_Well,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
2323
1,CDPH-SAL__Salmonella__Typhi__MDL-143,CDPH-SAL..Salmonella..Typhi..MDL-143,StudyB_11661_P40,A1,iTru7_107_07,CCGACTAT,iTru5_01_A,ACCGACAA,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-143
2424
1,CDPH-SAL_Salmonella_Typhi_MDL-144,CDPH-SAL.Salmonella.Typhi.MDL-144,StudyB_11661_P40,C1,iTru7_107_08,CCGACTAT,iTru5_02_A,CTTCGCAA,StudyB_11661,pool2,CDPH-SAL_Salmonella Typhi_MDL-144
2525
1,CDPH-SAL_Salmonella_Typhi_MDL-145,CDPH-SAL.Salmonella.Typhi.MDL-145,StudyB_11661_P40,E1,iTru7_107_09,GCCTTGTT,iTru5_03_A,AACACCAC,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-145

tests/data/duplicate_sample-sample-sheet.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
[Header],,,,,,,,,,,
22
IEMFileVersion,4,,,,,,,,,,
33
SheetType,standard_metag,,,,,,,,,,
4-
SheetVersion,100,,,,,,,,,,
4+
SheetVersion,90,,,,,,,,,,
55
Investigator Name,Knight,,,,,,,,,,
66
Experiment Name,RKL0042,,,,,,,,,,
77
Date,2020-02-26,,,,,,,,,,
@@ -19,7 +19,7 @@ Chemistry,Default,,,,,,,,,,
1919
ReverseComplement,0,,,,,,,,,,
2020
,,,,,,,,,,,
2121
[Data],,,,,,,,,,,
22-
Lane,Sample_ID,Sample_Name,Sample_Plate,well_id_384,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
22+
Lane,Sample_ID,Sample_Name,Sample_Plate,Sample_Well,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
2323
1,CDPH-SAL_Salmonella_Typhi_MDL-143,CDPH-SAL.Salmonella.Typhi.MDL-143,StudyB_11661_P40,A1,iTru7_107_07,CCGACTAT,iTru5_01_A,ACCGACAA,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-143
2424
1,CDPH-SAL_Salmonella_Typhi_MDL-144,CDPH-SAL.Salmonella.Typhi.MDL-144,StudyB_11661_P40,C1,iTru7_107_08,CCGACTAT,iTru5_02_A,CTTCGCAA,StudyB_11661,pool2,CDPH-SAL_Salmonella Typhi_MDL-144
2525
1,CDPH-SAL_Salmonella_Typhi_MDL-145,CDPH-SAL.Salmonella.Typhi.MDL-145,StudyB_11661_P40,E1,iTru7_107_09,GCCTTGTT,iTru5_03_A,AACACCAC,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-145

tests/data/good-sample-sheet.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
[Header],,,,,,,,,,,
22
IEMFileVersion,4,,,,,,,,,,
33
SheetType,standard_metag,,,,,,,,,,
4-
SheetVersion,100,,,,,,,,,,
4+
SheetVersion,90,,,,,,,,,,
55
Investigator Name,Knight,,,,,,,,,,
66
Experiment Name,RKL0042,,,,,,,,,,
77
Date,2020-02-26,,,,,,,,,,
@@ -19,7 +19,7 @@ Chemistry,Default,,,,,,,,,,
1919
ReverseComplement,0,,,,,,,,,,
2020
,,,,,,,,,,,
2121
[Data],,,,,,,,,,,
22-
Lane,Sample_ID,Sample_Name,Sample_Plate,well_id_384,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
22+
Lane,Sample_ID,Sample_Name,Sample_Plate,Sample_Well,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,syndna_pool_number,Well_description
2323
1,CDPH-SAL__Salmonella__Typhi__MDL-143,CDPH-SAL..Salmonella..Typhi..MDL-143,StudyB_11661_P40,A1,iTru7_107_07,CCGACTAT,iTru5_01_A,ACCGACAA,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-143
2424
1,CDPH-SAL_Salmonella_Typhi_MDL-144,CDPH-SAL.Salmonella.Typhi.MDL-144,StudyB_11661_P40,C1,iTru7_107_08,CCGACTAT,iTru5_02_A,CTTCGCAA,StudyB_11661,pool2,CDPH-SAL_Salmonella Typhi_MDL-144
2525
1,CDPH-SAL_Salmonella_Typhi_MDL-145,CDPH-SAL.Salmonella.Typhi.MDL-145,StudyB_11661_P40,E1,iTru7_107_09,GCCTTGTT,iTru5_03_A,AACACCAC,StudyB_11661,pool1,CDPH-SAL_Salmonella Typhi_MDL-145

tests/data/good-sample-sheet_w_context.csv

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -805,10 +805,10 @@ Lane,Sample_ID,Sample_Name,Sample_Plate,well_id_384,I7_Index_ID,index,I5_Index_I
805805
1,EP479894B04,EP479894B04,StudyA_13059_P4,P24,iTru7_107_08,AGCTAACC,iTru5_124_H,AACGCCTT,StudyA_13059,pool1,EP479894B04
806806
,,,,,,,,,,,
807807
[Bioinformatics],,,,,,,,,,,
808-
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,,,,
809-
StudyA_13059,13059,FALSE,AACC,GGTT,FALSE,Nextera,Equipment,,,,
810-
StudyB_11661,11661,FALSE,AACC,GGTT,FALSE,Nextera,Equipment,,,,
811-
StudyC_6123,6123,FALSE,AACC,GGTT,TRUE,Nextera,Equipment,,,,
808+
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,contains_replicates,,,
809+
StudyA_13059,13059,FALSE,AACC,GGTT,FALSE,Nextera,Equipment,False,,,
810+
StudyB_11661,11661,FALSE,AACC,GGTT,FALSE,Nextera,Equipment,False,,,
811+
StudyC_6123,6123,FALSE,AACC,GGTT,TRUE,Nextera,Equipment,False,,,
812812
,,,,,,,,,,,
813813
[Contact],,,,,,,,,,,
814814
Email,Sample_Project,,,,,,,,,,

tests/data/good_sheet_w_replicates.csv

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ Chemistry,Default,,,,,,,,,,
1919
ReverseComplement,0,,,,,,,,,,
2020
,,,,,,,,,,,
2121
[Data],,,,,,,,,,,
22-
Lane,orig_name,Sample_ID,Sample_Name,source_well_384,destination_well_384,Sample_Plate,well_id_384,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,Well_description
22+
Lane,orig_name,Sample_ID,Sample_Name,well_id_384,destination_well_384,Sample_Plate,Sample_Well,I7_Index_ID,index,I5_Index_ID,index2,Sample_Project,Well_description
2323
1,BLANK.43.12G,BLANK_43_12G_A1,BLANK.43.12G.A1,A1,A1,StudyB_11661_P43,A1,iTru7_114_08,CCGACTAT,iTru5_01_A,AAGGCTGA,StudyB_11661,blue_quadrant
2424
1,BLANK.43.12H,BLANK_43_12H_A3,BLANK.43.12H.A3,A3,A3,StudyB_11661_P43,A3,iTru7_114_09,ACCGACAA,iTru5_02_A,CGATCGAT,StudyB_11661,blue_quadrant
2525
1,RMA.KHP.rpoS.Mage.Q97D,RMA_KHP_rpoS_Mage_Q97D_A5,RMA.KHP.rpoS.Mage.Q97D.A5,A5,A5,StudyB_11661_P43,A5,iTru7_114_10,CCGACTAT,iTru5_03_A,TTACCGAG,StudyB_11661,blue_quadrant

tests/data/good_sheet_w_replicates_and_context_demux_1.csv

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -42,11 +42,11 @@ EP159692B04_C7,EP159692B04,C7,iTru7_108_10,AAGCACTG,iTru5_02_B,GTGGTATG,ProjectN
4242
EP987683A01_C9,EP987683A01,C9,iTru7_108_11,CCAAGCAA,iTru5_03_B,TGAGCTGT,ProjectN_13059,C9,ProjectN_13059_P1,C9,blue_quadrant
4343
,,,,,,,,,,,
4444
[Bioinformatics],,,,,,,,,,,
45-
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,,,,
46-
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,,,,
47-
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,,,,
48-
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
49-
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
45+
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,contains_replicates,,,
46+
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,False,,,
47+
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,False,,,
48+
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
49+
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
5050
,,,,,,,,,,,
5151
[Contact],,,,,,,,,,,
5252
Email,Sample_Project,,,,,,,,,,

tests/data/good_sheet_w_replicates_and_context_demux_2.csv

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -42,11 +42,11 @@ LP127890A01_C6,LP127890A01,C6,iTru7_108_09,TCTATAGG,iTru5_01_B,AGTCGCAA,ProjectN
4242
EP159692B04_C8,EP159692B04,C8,iTru7_108_10,AAGTTATG,iTru5_02_B,GTGGAATG,ProjectN_13059,C8,ProjectN_13059_P1,C7,green_quadrant
4343
,,,,,,,,,,,
4444
[Bioinformatics],,,,,,,,,,,
45-
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,,,,
46-
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,,,,
47-
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,,,,
48-
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
49-
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
45+
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,contains_replicates,,,
46+
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,False,,,
47+
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,False,,,
48+
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
49+
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
5050
,,,,,,,,,,,
5151
[Contact],,,,,,,,,,,
5252
Email,Sample_Project,,,,,,,,,,

tests/data/good_sheet_w_replicates_and_context_demux_3.csv

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -42,11 +42,11 @@ LP127890A01_D6,LP127890A01,D6,iTru7_108_09,TGTCTAGG,iTru5_01_B,AGTGGCAA,ProjectN
4242
EP159692B04_D8,EP159692B04,D8,iTru7_108_10,AGGCACTG,iTru5_02_B,GTGGTATG,ProjectN_13059,D8,ProjectN_13059_P1,C7,yellow_quadrant
4343
,,,,,,,,,,,
4444
[Bioinformatics],,,,,,,,,,,
45-
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,,,,
46-
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,,,,
47-
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,,,,
48-
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
49-
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,,,,
45+
Sample_Project,QiitaID,BarcodesAreRC,ForwardAdapter,ReverseAdapter,HumanFiltering,library_construction_protocol,experiment_design_description,contains_replicates,,,
46+
ProjectF_11661,11661,False,AACC,GGTT,False,Nextera,Equipment,False,,,
47+
ProjectN_13059,13059,False,AACC,GGTT,False,Knight Lab Kapa HP,Equipment,False,,,
48+
TMI_10317,10317,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
49+
Other_11223,11223,False,AACC,GGTT,False,Knight Lab Kapa HP,Eqiiperiment,False,,,
5050
,,,,,,,,,,,
5151
[Contact],,,,,,,,,,,
5252
Email,Sample_Project,,,,,,,,,,

0 commit comments

Comments
 (0)