|
3 | 3 | // Information about enclone tests.
|
4 | 4 | pub mod main_testlist;
|
5 | 5 |
|
6 |
| -pub fn enclone_testdata() -> String { |
7 |
| - include_str!["enclone.testdata"].to_string() |
8 |
| -} |
9 |
| -pub fn enclone_testdata_public_bcr_human() -> String { |
10 |
| - include_str!["testdata.public.bcr.human"].to_string() |
11 |
| -} |
12 |
| -pub fn enclone_testdata_public_tcr_human() -> String { |
13 |
| - include_str!["testdata.public.tcr.human"].to_string() |
14 |
| -} |
15 |
| -pub fn enclone_testdata_public_tcr_mouse() -> String { |
16 |
| - include_str!["testdata.public.tcr.mouse"].to_string() |
17 |
| -} |
18 |
| -pub fn enclone_testdata_public_gex_human() -> String { |
19 |
| - include_str!["testdata.public.gex.human"].to_string() |
20 |
| -} |
21 |
| - |
22 | 6 | pub const TEST_FILES_VERSION: u8 = 15;
|
23 | 7 |
|
24 |
| -// Unaccounted time test. This is separated out so that we can avoid running it in parallel with |
25 |
| -// other tests, to reduce the sporadic failure rate. Also this is off in GitHub Actions. |
26 |
| - |
27 |
| -pub const UNAC_TESTS: [&str; 1] = [ |
28 |
| - // 1. enforce no unaccounted time |
29 |
| - r###"BCR=123085 COMPE UNACCOUNTED NOPRINT EXPECT_OK"###, |
30 |
| -]; |
31 |
| - |
32 |
| -// Tests that are affected by the D region alignment algorithm. All such tests should go here. |
33 |
| - |
34 |
| -pub const DTESTS: [&str; 15] = [ |
35 |
| - // 1. test ALIGN_2ND<n> |
36 |
| - r###"BCR=123085 CDR3=CKVMLYDSRGSDYYYVMDVW ALIGN_2ND1 CVARS=d1_name"###, |
37 |
| - // 2. test JALIGN_2ND<n> |
38 |
| - r###"BCR=123085 CDR3=CKVMLYDSRGSDYYYVMDVW JALIGN_2ND1 CVARS=d2_name"###, |
39 |
| - // 3. test ALIGN_JALIGN_CONSISTENCY |
40 |
| - r###"BCR=123085 CELLS=1 CHAINS=2 ALIGN1 JALIGN1 ALIGN_JALIGN_CONSISTENCY AMINO=cdr3 |
41 |
| - PLAIN NOPAGER EXPECT_OK"###, |
42 |
| - // 4. test D_INCONSISTENT, and lock number of inconsistencies |
43 |
| - r###"BCR=123085 D_INCONSISTENT CVARS=d1_name COMPLETE NGROUP"###, |
44 |
| - // 5. the JALIGN1 in this example had a boundary location that was off by one |
45 |
| - r###"BCR=165807 JALIGN1 AMINO=cdr3 CVARS=d1_score,d2_score CDR3=CAKEYYDFWSGYSDVRGVIPNIDYW"###, |
46 |
| - // 6. the JALIGN1 in this example had a boundary location that was off by one |
47 |
| - r###"BCR=123085 CELLS=2 JALIGN1 AMINO=cdr3 CVARS=d1_name CDR3=CAKAGPTESGYYVWYFDLW"###, |
48 |
| - // 7. test d_inconsistent_{%,n} |
49 |
| - r###"BCR=123085 GVARS=d_inconsistent_%,d_inconsistent_n NOPRINT SUMMARY SUMMARY_CLEAN"###, |
50 |
| - // 8. test ALIGN<n> |
51 |
| - r###"BCR=123085 CDR3=CKVMLYDSRGSDYYYVMDVW ALIGN1 CVARS=d1_name"###, |
52 |
| - // 9. test ALIGN<n> and JALIGN<n>, case where there's a D segment |
53 |
| - r###"BCR=85333 ALIGN1 JALIGN1 CDR3=CARGYDFWSGYLVGNWAGDYYYYMDVW"###, |
54 |
| - // 10. test ALIGN<n> and JALIGN<n>, case where there is no D segment |
55 |
| - r###"BCR=85333 ALIGN1 JALIGN1 CDR3=CAKGKGFRNYYYYMDVW"###, |
56 |
| - // 11. test d1 etc. |
57 |
| - r###"BCR=123085 CVARS=d1_name,d2_name,d_Δ,d_delta AMINO=cdr3 CDR3=CARVRDILTGDYGMDVW"###, |
58 |
| - // 12. test GROUP_VDJ_REFNAME_HEAVY (deprecated but supported) |
59 |
| - r###"BCR=86237 GROUP_VDJ_REFNAME_HEAVY CDR3="CAKAVAGKAVAGGWDYW|CAKVSTGIAVAGPGDYW" COMPLETE"###, |
60 |
| - // 13. test GROUP_VJ_REFNAME_HEAVY (deprecated but supported) |
61 |
| - r###"BCR=86237 GROUP_VJ_REFNAME_HEAVY CDR3="CARGVLWFGELGAFDIW|CARAGLGVVLAARGAFDIW""###, |
62 |
| - // 14. test placement of indel, needed shifting right |
63 |
| - r###"BCR=123085 CELLS=1 CHAINS=2 AMINO=cdr3 JALIGN2 CDR3=CAKDKSRPPTHYYGSGSYYSRILDNW"###, |
64 |
| - // 15. test placement of indel, needed shifting left |
65 |
| - r###"BCR=123085 CELLS=1 CHAINS=2 AMINO=cdr3 JALIGN2 CDR3=CARMAQFYSGSGTYYIGPYYFEYW"###, |
66 |
| -]; |
67 |
| - |
68 |
| -// Tests that are affected by the grouping algorithm. All such tests should go here, if not |
69 |
| -// already in DTESTS. |
70 |
| - |
71 |
| -pub const GTESTS: [&str; 21] = [ |
72 |
| - // 1. test 5/8 for newline correctness (this grouping option deprecated but supported) |
73 |
| - r###"BCR=85333 GROUP_VJ_REFNAME MIN_GROUP=2 AMINO= PLAIN SET_IN_STONE"###, |
74 |
| - // 2. test 6/8 for newline correctness (this grouping option deprecated but supported) |
75 |
| - r###"BCR=85333 GROUP_VJ_REFNAME MIN_GROUP=2 AMINO= PLAIN NGROUP SET_IN_STONE"###, |
76 |
| - // 3. test 7/8 for newline correctness (this grouping option deprecated but supported) |
77 |
| - r###"BCR=85333 GROUP_VJ_REFNAME MIN_GROUP=2 AMINO= PLAIN HTML SET_IN_STONE"###, |
78 |
| - // 4. test 8/8 for newline correctness (this grouping option deprecated but supported) |
79 |
| - r###"BCR=85333 GROUP_VJ_REFNAME MIN_GROUP=2 AMINO= PLAIN HTML NGROUP SET_IN_STONE"###, |
80 |
| - // 5. test of GROUP |
81 |
| - r###"BCR=123085 GROUP=vj_refname,cdr3_aa_heavy≥80%,cdr3_aa_light≥80% CVARS=cdr3_len |
82 |
| - AMINO=cdr3 CDR3="CARHLQWELP.*W""###, |
83 |
| - // 6. test of GROUP |
84 |
| - r###"BCR=123085 GROUP=vj_refname,len,cdr3_len MIN_GROUP=2 MIN_CHAINS=2 CDR3="CQQSY.*TLATF" |
85 |
| - CVARS=cdr3_len"###, |
86 |
| - // 7. test of GROUP |
87 |
| - r###"BCR=123085 GROUP=cdr3_aa_heavy≥100% MIN_GROUP=2 MIN_CHAINS=2 CVARS=cdr3_len |
88 |
| - CDR3=CARPKSDYIIDAFDIW"###, |
89 |
| - // 8. test of GROUP |
90 |
| - r###"BCR=123085 GROUP=cdr3_aa_light≥100% MIN_GROUP=2 MIN_CHAINS=2 CVARS=cdr3_len |
91 |
| - CDR3=CQTWGTGPWVF"###, |
92 |
| - // 9. test of GROUP |
93 |
| - r###"BCR=123085 GROUP=vj_refname,aa_heavy≥100% MIN_GROUP=2 MIN_CHAINS=2 CVARS=cdr3_len |
94 |
| - CDR3=CARVPYYYDRSYYYYGMDVW"###, |
95 |
| - // 10. test of AGROUP |
96 |
| - r###"BCR=123085 AGROUP AG_CENTER=from_filters CDR3=CARHSYSSGWYDEWDYW |
97 |
| - AG_DIST_FORMULA=cdr3_edit_distance AG_DIST_BOUND=top=2"###, |
98 |
| - // 11. test of AGROUP |
99 |
| - r###"BCR=123085 AGROUP AG_CENTER=from_filters CDR3=CAKDGGEHYYDSSGYYASYYFDYW |
100 |
| - AG_DIST_FORMULA=cdr3_edit_distance AG_DIST_BOUND=max=14"###, |
101 |
| - // 12. test of AGROUP |
102 |
| - r###"BCR=123085 AGROUP AG_CENTER=from_filters CDR3=CAKDGGEHYYDSSGYYASYYFDYW |
103 |
| - AG_DIST_FORMULA=cdr3_edit_distance AG_DIST_BOUND=max=13"###, |
104 |
| - // 13. test of AGROUP |
105 |
| - r###"BCR=123085 AGROUP AG_CENTER=copy_filters MIN_CELLS=2 MAX_CELLS=2 |
106 |
| - AG_DIST_FORMULA=cdr3_edit_distance AG_DIST_BOUND=max=3 MIN_GROUP=2"###, |
107 |
| - // 14. test symmetric grouping stats |
108 |
| - r###"BCR=123085 GROUP=vj_refname,cdr3_aa_heavy≥80%,cdr3_aa_light≥80% NOPRINT |
109 |
| - SUMMARY SUMMARY_CLEAN"###, |
110 |
| - // 15. test of GROUP |
111 |
| - r###"BCR=123085 GROUP=cdr3_heavy≥100% MIN_GROUP=2 MIN_CHAINS=2 CVARS=cdr3_len |
112 |
| - CDR3=CARPKSDYIIDAFDIW"###, |
113 |
| - // 16. test of GROUP |
114 |
| - r###"BCR=123085 GROUP="cdr3_light>=100%" MIN_GROUP=2 MIN_CHAINS=2 CVARS=cdr3_len |
115 |
| - CDR3=CQTWGTGPWVF"###, |
116 |
| - // 17. test of GROUP |
117 |
| - r###"BCR=123085 GROUP=vj_refname,heavy≥96.6% MIN_GROUP=2 MIN_CHAINS=2 |
118 |
| - CDR3="CARVIVGPKKLEGRLYSSSLHFDCW|CARVIVGPEKQEGRLYSSSLHFDYW" POUT=stdout PCOLS=vj_seq1"###, |
119 |
| - // 18. test of GROUP |
120 |
| - r###"BCR=123085 GROUP=vj_heavy_refname,cdr3_heavy_len,cdr3_heavy≥80% LVARS=n,donors,dref |
121 |
| - CVARS=const,cdr3_len AMINO=cdr3 CHAINS=2 MIN_GROUP=2 |
122 |
| - CDR3="CARDLHGYDPYGMDVW|CARELRHYDTYGMDVW""###, |
123 |
| - // 19. test of GROUP |
124 |
| - r###"BCR=123085 GROUP=vj_refname,cdr3_light_len LVARS=n,donors,dref CVARS=const,cdr3_len |
125 |
| - AMINO=cdr3 CHAINS=2 MIN_GROUP=2 CDR3="CARESAVAGDMDVW|CARDYGDYRWWVDGMDVW""###, |
126 |
| - // 20. test of group |
127 |
| - r###"BCR=123085 GROUP=vj_refname GROUP_CDR3=CACFGRIGVVVRAAHYW"###, |
128 |
| - // 21. test of group, asserted at one time |
129 |
| - r###"BCR=123085 GROUP=vj_refname,cdr3_len MIN_GROUP=3 HONEY=out=stdout,color=var,u1 |
130 |
| - EXPECT_OK"###, |
131 |
| -]; |
132 |
| - |
133 |
| -// Crash tests. These are tests to make sure that certain options do not result in a crash, even |
134 |
| -// when run on a large and complex dataset. The options are in groups because not all are |
135 |
| -// compatible with each other. The datasets are defined by a single fixed list, to be enlarged |
136 |
| -// over time based on discovery of pathologies in particular PUBLIC datasets. |
137 |
| -// All run with certain shared options. |
138 |
| - |
139 |
| -pub const CRASH_DATA: &str = "BCR=\"45977;123085;testx/inputs/flaky\""; |
140 |
| -pub const CRASH_OPTS: &str = "NOPRINT BUILT_IN EXPECT_OK NO_PRE NFORCE"; |
141 |
| -pub const CRASH_SETS: [&str; 6] = [ |
142 |
| - /* 1 */ "CONP SEQC SUM MEAN BARCODES DIFF_STYLE=C1 GROUP_VJ_REFNAME", |
143 |
| - // |
144 |
| - /* 2 */ "CONX FULL_SEQC DIFF_STYLE=C2 POUT=stdout PCOLS=count_CAR", |
145 |
| - // |
146 |
| - /* 3 */ |
147 |
| - "AMINO=fwr1,cdr1,fwr2,cdr2,fwr3,cdr3,fwr4 CVARS=d1_name,d2_name,d_delta,d_Δ,cigar", |
148 |
| - // |
149 |
| - /* 4 */ |
150 |
| - "PLOT_BY_ISOTYPE=stdout MIN_CELLS=3 GROUP_VJ_REFNAME_HEAVY ALIGN1 JALIGN1", |
151 |
| - // |
152 |
| - /* 5 */ |
153 |
| - "GROUP_VDJ_REFNAME_HEAVY GVARS=d_inconsistent_%,d_inconsistent_n", |
154 |
| - // |
155 |
| - /* 6 */ |
156 |
| - "GROUP=vj_refname,cdr3_aa_heavy≥90%,cdr3_aa_light≥90%", |
157 |
| -]; |
158 |
| - |
159 |
| -// Test using datasets that are either in the extended public dataset collection, |
160 |
| -// or which require samtools. |
161 |
| - |
162 |
| -pub const EXTENDED_TESTS: [&str; 12] = [ |
163 |
| - // 1. Make sure that POUT works on full dataset. |
164 |
| - // If we experience failures on other PUBLIC ids, we can add them to this list. |
165 |
| - r###"BCR=86237 RE POUT=/dev/null NOPRINT EXPECT_OK NO_PRE NFORCE"###, |
166 |
| - // 2. tests nd2 |
167 |
| - r###"BCR=47199,47200,47212 AMINO=cdr3 NCROSS LVARS=nd2 CDR3=CVKGKSGSFWYYFENW |
168 |
| - NO_PRE NFORCE"###, |
169 |
| - // 3. test sec and mem [requires samtools] |
170 |
| - r###"BCR=123085 GEX=123217 LVARSP=sec,mem CDR3=CVKDRVTGTITELDYW"###, |
171 |
| - // 4. crashed at one point |
172 |
| - r###"BCR=128037,128040 GEX=127798,127801 LVARSP=pe1 NOPRINT EXPECT_OK NO_PRE NFORCE"###, |
173 |
| - // |
174 |
| - // 5. this added because it got better when a bug in bads detection was fixed |
175 |
| - r###"TCR=163914 CDR3=CASRLGGEETQYF NO_PRE NFORCE"###, |
176 |
| - // 6. Test PCHAINS=max. For this we need a clonotype having at least five chains, and the |
177 |
| - // question is whether the header line represents cvars for all the chains. The output of |
178 |
| - // this is expected to change whenever variables are added. |
179 |
| - r###"BCR=123085,123089,124547 NWEAK_CHAINS NDOUBLET MIN_CHAINS=5 POUT=stdout PCHAINS=max |
180 |
| - NOPRINT RE NO_PRE NFORCE"###, |
181 |
| - // 7. test MIN_GROUP_DONORS |
182 |
| - r###"BCR="40953;43899" MIX_DONORS MIN_GROUP=2 NO_PRE NFORCE |
183 |
| - GROUP="cdr3_len,cdr3_aa_heavy>=85%,cdr3_aa_light>=85%,vj_refname" MIN_GROUP_DONORS=2"###, |
184 |
| - // 8. this asserted at one point |
185 |
| - r###"BUILT_IN GROUP=vj_refname,cdr3_aa_heavy≥90% MIN_CHAINS_EXACT=2 MIN_GROUP=2 |
186 |
| - KEEP_CLONO_IF_CELL_MEAN="cdr3_len1>=18" BCR=1018096-1018098 JALIGN1 NO_PRE NFORCE |
187 |
| - EXPECT_OK"###, |
188 |
| - // 9. this clonotype included a junk chain before we made a change, and test "/outs" |
189 |
| - r###"TCR=163911/outs CDR3=CAPSAGDKIIF AMINO=donor NO_PRE NFORCE"###, |
190 |
| - // 10. test case where digit rows are just barely present |
191 |
| - r###"TCR=163911 CDR3=CASSLVQPSTDTQYF AMINO=donor NO_PRE NFORCE"###, |
192 |
| - // 11. this added because it got better when a noise filter was added, also tests u_max |
193 |
| - r###"TCR=163914 CDR3=CASSLVQPSTDTQYF CVARSP=u_max NO_PRE NFORCE"###, |
194 |
| - // 12. this added because it got better when a noise filter was added; also test FASTA |
195 |
| - r###"TCR=163914 CDR3=CAFRGGSYIPTF FASTA=stdout NO_PRE NFORCE"###, |
196 |
| -]; |
197 |
| - |
198 |
| -// Tests of internal features. |
199 |
| - |
200 |
| -pub const INTERNAL_TESTS: [&str; 3] = [ |
201 |
| - // 1. gave wrong result |
202 |
| - r###"123085 CDR3=CARDRIAGRFGYGMDVW NFORCE"###, |
203 |
| - // 2. test human + IMGT; note that specifying by number forces BCR+TCR reference checks |
204 |
| - r###"123085 REQUIRE_UNBROKEN_OK IMGT ACCEPT_BROKEN EXPECT_NULL"###, |
205 |
| - // 3. this crashed; it is not exactly an internal feature test but uses an internal feature |
206 |
| - // (IMGT) to exhibit the phenomenon |
207 |
| - r###"BCR=123085 IMGT RE ACCEPT_BROKEN POUT=stdout PCELL BARCODE=AGCAGCCCATTAGGCT-1 |
208 |
| - EXPECT_OK"###, |
209 |
| -]; |
210 |
| - |
211 |
| -// List of examples in documentation. |
212 |
| - |
213 |
| -pub const EXAMPLES: [&str; 2] = [ |
214 |
| - // 1. |
215 |
| - r###"BCR=123089 CDR3=CARRYFGVVADAFDIW"###, |
216 |
| - // 2. |
217 |
| - r###"BCR=123085 GEX=123217 LVARSP=gex,IGHV2-5_g_μ CDR3=CALMGTYCSGDNCYSWFDPW"###, |
218 |
| -]; |
219 |
| - |
220 | 8 | // List of examples on site.
|
221 | 9 |
|
222 | 10 | pub const SITE_EXAMPLES: [(&str, &str); 28] = [
|
|
0 commit comments