From 8911a6f7eff40331b0d207228404c9fb6842d98f Mon Sep 17 00:00:00 2001 From: Dilawar Singh <dilawar@subcom.tech> Date: Sat, 30 Jul 2022 15:29:40 +0530 Subject: [PATCH] Added the pipeline. Run `copr .` --- data/non-curated/SampleInputFileLinks.txt | 12 ------------ .../TrainingDataSet_Process_Codes.xlsx | Bin 11017 -> 0 bytes vendor/shodhka/test_20220727/README.md | 15 ++++++++++----- vendor/shodhka/test_20220727/run.copr.sh | 11 +++++++++++ 4 files changed, 21 insertions(+), 17 deletions(-) delete mode 100644 data/non-curated/SampleInputFileLinks.txt delete mode 100644 data/non-curated/TrainingDataSet_Process_Codes.xlsx create mode 100755 vendor/shodhka/test_20220727/run.copr.sh diff --git a/data/non-curated/SampleInputFileLinks.txt b/data/non-curated/SampleInputFileLinks.txt deleted file mode 100644 index 0c16ca5..0000000 --- a/data/non-curated/SampleInputFileLinks.txt +++ /dev/null @@ -1,12 +0,0 @@ -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/096/SRR11862696/SRR11862696_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/096/SRR11862696/SRR11862696_2.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/097/SRR11862697/SRR11862697_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/097/SRR11862697/SRR11862697_2.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/099/SRR11862699/SRR11862699_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/099/SRR11862699/SRR11862699_2.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/082/SRR11862682/SRR11862682_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/082/SRR11862682/SRR11862682_2.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/091/SRR11862691/SRR11862691_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/091/SRR11862691/SRR11862691_2.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/092/SRR11862692/SRR11862692_1.fastq.gz -ftp://ftp.sra.ebi.ac.uk/vol1/fastq/SRR118/092/SRR11862692/SRR11862692_2.fastq.gz \ No newline at end of file diff --git a/data/non-curated/TrainingDataSet_Process_Codes.xlsx b/data/non-curated/TrainingDataSet_Process_Codes.xlsx deleted file mode 100644 index 9274d9783e06864b6f3e6a3af5613f3def54ba61..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 11017 zcmeHt1y@|zwsj%Fox<JS2`<6i-QC?u@Zbap?(Py?f)iW=f#B{C2oT)it90Lc(@p2S zAMn0=YK%H{#;G-{&fas$UUMtTKtKWkPyiSJ06+qW{1zGM3kCp0z5oEw0ZU*yA`bSh zX7;WIs;?c*T=W<{?QDtj=D?_P0N|kS|M&PmHUb}1hwQtVQQ9^31w}j5!vjRr)F6@c zq8ZT6A!PYb-t{)}K?HXmlhc%_T9M;2hSy%(`EH)L8emQ!f#X`Ju*gD@f~Rxaedoa- zdN+G5Bq}*<t;Pjk$_0q{wsmRV#^w1bOhZRjOn!@~u$Mkm*=U1L^Rd=BSGD)O5kvbh zhc%)zJNDAZs1~>kiyF2ut8Yl+0w%Ei`;A+^snv(Dth6WEGF9qh_;?!QTxW|5rntEZ zbxMfCTDzeyu(tqd6QoyWvDbzvETaKoQMobkC%oxM;v(!S0V}FQ2+jtQ#?W7MLt(x4 zDDt3M%M~9fMR|b!?WJQ6961s@NuCfu&(wxvL|IR>cIXtm_XG&b^KKTW-@47eE$u9n zs@h3Pn|)XE(1C3du3O`iX4G{6Q+%l%7|kytObk&xy3o|@pLo^MNPVza@-gJhI^#zx ztL4OmAMRr@gbT*2@o*|np9_|o@a4pTQuI`K$D0s*i(>8NNl2~i!gwYSi=Lh!0E&Ne z#RfHIvJ221S&*l}1IEA%oXu=qm>7S)6Xy;8*9HI2xL#!3xO@*YLjSR3o5<GPzP%(& zZegpeWGjg(;V1GVqK2q^@>f@vK@e}HO%^9EcgF>FR*rV8REhA7ndEy~sD*0SjJ;;9 zJu9-+k#memEv$e8xY77V8p|uT2A%~8>Bh5nCAII~;kG2)lNqxUC;;J4zB?DjGAj)m zSx&^`l$b3gZ1ab75-KwAO?O$tKzl)#3EcAC)P7`_bMR!^@i9)8k9?Jd&O741En*H| zI=)zvCOje)h;f$j6?N#2)C3}nazR(&{Hc-4iBu;1i{#oF-)e-*tAm38#%#;d>-I6e zjpCqnIn!&Su0CW{gWqypy0pmX7Ia4f0sz1Tz<_z$GW|(+4+m!(V+RMDpNZ#R)Q9{@ zeNc+}|NCf*`)u9Ij1Y7j+z~j@?iBZ^ILzZk6Wrdo2+drB7Aj|JQY!fRE-m4Rqq-pZ zOFlXK8Ox~o9ryVL0h!wh4RtL(WXnSOSOc8?m4e0<aaaRe%M}tvq-1pkBNNB?oQ=GK zY3nP}QZ8k~)SkcuRULeGGl3kL<o*F67hDs%z)Iv6F|D1O%*f7{IcZiAnMx=gJGi~R z2tzjxcB|}qQSUo^@xGkkzz>DP$LB;d)V{U4*T>WXfAKmiS2upWX8=M=RKN*egS=R# z8B*n*ZPb|cqfK|rH0o#g0aXE>LN*;H3YR)sg!exCw>5O^p9L?S)t~m^e-|aa2BM@s zg4nPPijv46N`RR2SI$H#%Q-AEBeWyW`JuRanDVNh1<dtLHfaXrQO{KJ+prSA*HDNk zn`4PQd0BZ`1zyy~OG<km$10?cbd(M`RLkRJPFi9rgKMV=fAf*{6VQj2k<P$sL1~zX znZ$BDXT7^M`-<arZ8jP}?C(xf(dIB4$*m<swlrFwb5g|Kh)Sr^YEjuh45tBhU1aWr ztzRupEk_m9@IZv1k|f<dHfRE|pg@diy{^<zu6khENTY_R@Ksc_{xH*0(ZfJR8GiRn z_%*e1nxQq%HMOpy@%zKelKu6hQ2626E0SXd%AR@!IG!sdBIQXzI=vLe!lu^bx+c7l z@v<Kn_DSRD@<Xb3NY(~738!kK(75hU{729<{qcKB_wt@6{%3g@J(u>1MnTTAa1dT9 zq7eO^#}0`CO?4qRS|WULSt$i2+wBxRETm^C5@h7(k25!&m*=QYri%FmFUJymDdl=7 z9R%j_gXtqEi|Y`D<MP#L9?&V)KZ-R;zh%xoBi5?iFiaiYT%(=u<2Kl8^&T;pklWJB zeq6|@MVk@SCPBUy@q5*bfwWAp%?df7Ctt?G<!0spn!$f&!WXJy?LQ+!A{+pK_~#tE zxW2YEbNLw++SGL%7MOv)+4WB-H~gOqgTSOqq^;_u^wdga7s{pZt9N9!Qjj<fJCEn2 zB;Vw!+I_?_CK@}r>2RsrtYfekBT&LfBo*oke~(YfnyOMG{pF+BesqkA6}|Il0Ws`C zEL^6Xpl=vmyUCWjT$uYBj1q-qg&X%t8?6p{bUC^f8rTz1+3AB(xw^g@?c1|qY^R;z z4#9J-B5=7)VK_bR)FqhAoUh`{QRN0>1m^y9uU6Q{$m5469Qgn>XaU@%FBzHhWyGSi z1GvpvwefKS#HRL~XbV_{$D2M7C~Ou^+$wZ%NO<2sEiZ;^`C_0HL>`jir47C{#7)+; z$rFXcE7oFir|4CCm3DBg*-o}V7wjQ~eSyGtfFew*hGaIqGv!$+_BAC|7(zl!!{%(d zHfXhQO50g;3s_a~2_Z?}X2Lg$B7sa*|LysLy1X7xb<0%d6cP~{^PQ3{Uz_BragCyW z0aA=kFVkez5dY^264=sV7?Y17OII8EOO3%~9DLii@F+o0FB2CTNu)m4Mk}=k%n`7{ zbv;^<K_^oz>N#A;l}x!;T$mRY$+s+z?ldlDv$ddQq^!K~oLLi>l4G?ij;OG#8n4`0 z$mb3@<qDc(7V!7f!QaNi|5%Ayj52Nh0blr3_PaH?J2gSAKoH~>!}~kQeLXx|#k$zT z7rg!@T}$OA$M>pDx-oV#-HVu^Cb#DF<EnGH-uxT$EMD)wF5L4+E_CwU5wM*`l(cuZ z9t!WZu2eU3T3^cTr{GZwWv|OCMn(|XMG2!N;|;T86rG8i&k58wbJPVkKz%B=_+bbH zM0+nH^4?YT%Xn(0urx_PS!@-2!YjhM6GWe?=#0y-=W?~kcM~}-Xp|r?(J@H9qr}D? z{6e9Dp^NgvjU$3`?`r$|S5M#6kfXuusHHBN@Fgeq^wx<rV~*@%6Tx$)M*!8?RH|)Y zSN<+iacW#5{kas>YzjSGTI>LFRt=|pHlO2QfpJbDZY|>VqI^=$N>PY|1E>G;fB;hH z<7?ox{hNL0Bf~I>BTG-*W-DOO*}9=SPN5RA*E!Gkfa4cJ&;n_e!>|eB>E#?EJ~ZU8 zjpH#t7GyoAANjc-ej8PN$(GL?K~WV3beHT`RCTd5GjnzMS8D#_g7rU%c{J&>LJu)^ z|1sqwGNMPW>S2Ud>$|k?YlUNHZy6pWbxJ-ZeeTq+wS*dq3_(xcv9iogHXsyO+1_W4 zn#huxhR=dPFhOC_4{zDELt5b&=fnw1C~7OpU!#YXDEd^^)S;bZTd;6n(Bi8e>$FY_ zojG#`AzZdUCyD`N+cYmgb<SI88^-)xk83%ih&DhI*9c9GKW?eF`>N7L#m^-}Zo9Kx z?CUv(7jW9%Sl56$fM=6@APc!aVL0g<K6^1vI+bdi@a2k#cGt51rEzabuC!myY;7-> zh*OgH2)mSCyWHA0l{w!>uFkLp+1qb9savj)d#uZLT&|{0MJ^YZUXu*qd1RQG`R#Q* zQm;H`Cds2O`{BbG8@gTUISG)cc|!*&FIGIQxLl8fUKfp^Iq={sdybj&Zle0N-8puX zjY(Nepg#SO4MiOemah)pvOIR#W+ZM|WpZ704~7)o-7?#~t||=Acx<=^CAxoxNM1Wu znJ&;o34<o>f1NOv|4dlW`>u#?W}w&=#G{C(SNu#cf`|$yX_MM6gz@bH)M9eX74X5U z4&Ut4_O|2rHb?p$Un!nBQY`&c3wZFB36^E`53dD=PN5pE{UsnQ17D2MSH_Ms2zhzw z@PQaj4EUO0CGrRC9^c;inrPV47=fL6sqoj#LpSg6zI-UNwmUU|u4j^OIHuq7(Fo+> zSJry`9_>TKXP@6WCV4s@B*h(LD3B+~Jt%f~>TfJ`;BlE{<AVfQWH&l;b_x5t5zuwk zB^v~d4J)XTf&CB4{vvCn+FvRH1KVb~G$^MCPrVvKD1;t?u`-4MVY`v|se*?qvTfC9 zf){fXv87j8k`V<n9#wL3m%@0Z3kkJavf-94YJ={{lLmrB0t_@PNgrQSsnIFlQX;f3 zdf!(IP(RqxlF)+%&lJ?xHtLAQ4$)0GvZ-WR8WpRytYZpXFtTQ1wmB9QMaOaJiy|g7 z9Ac>7`mw8O4eKtI-xs1*9E#PKG{1O~qu>?cJP__Cgc7Z%R%tOSkJS5WS?4bCl(b<e zKLbhjT6rIblki<aKe3T0gYy(Q{^R9FUCBX$uM{!=PL)dEOG$D4GuMa8r?tGNN+}ZQ zN99GL{U2(BdS)ckE(N<~Q1th4;>M3OR@dcsf`i@a)y8$E+!kkIti@YW*muOSvQm%6 zAFLnomBteFN4Z_c8CE|u@SqIR=Ex14M9<L%tU0sWcfm=gR6T?+%uEo1557;Iw>;~2 z5YO2&i_f9gZ2z7})k4N*T5t~RN+M*P?0~bfu+047&~tx);s>vOyx2f>*+F9RA+wi| z^%RkDgD(?Do5~w=he`OJL9^Y#Md7=TNWUoWNldH*C&?i~1^Oe(W7zv;UwvA`iw;Do zZ$IyPHC@JD+DY<?90Uml32w02cDU?*`QDDFyyCUXg?^JeGjQ6)F@&8)1&4+EHkcRu z^GetHN;Fc|m8f$rm1Yx7#_Nr>;7WfQ>_K9r0Rhnri^`t6(i!B~{R;G!q(e3Y+Rh^? zI*xk%A=1Lz8bhwYB7oyOL>vkr`qIA~1#mkIv4oOM2=;j$%)Uq-Ofi?R8ioMua2<@3 z1Ta+sO)mnVXM5j-NSYJL2fh}dYm|u)W5{z-2^}V5xz!VV_w8EVd-DyIj)=9A@N^$r zWTl_;(n8so)(N)~W>(Bq72JwB7_taoponzg_d96yV827oClI&)>HiBp8_p$A0Dune z&%WIsWw5KInVlKaAMbxS{dcYL_joUX9b_khkvmyCv!mo%FLfy53*eXS$|)K4C!{hW z@y5B*oZRu$5*58fg@u8=FT(MlAyus@7`LmmsNa%a7_7~+rOt)-*lX|ur<P^<&)Rp# zkLOqG29m3mkW1YnH-oB6tdf}$ZQ&)zI4CFTtyT%o;oKIbxgz?*YGF7JDdfM?-4XdZ z;vAj;Lg&EmsOLrGc-Oo;H0UYGEX9W?I0jJL(yO^d@d-DrobdC}f8b3T7pk5{kdVgO ziBUs-<fKGr?VfqnRDY#0)(Rvf%L)rYjk@c8IYUqG&PN9?S}W^~t1}SBVYg>7Di3un z@R1<`4T&kuUFvbZ?_or&J{d=;qes2wV5oDHkqvvCwszc;XO!0sfA&PX*$+0y8*jG4 zt-Uh&E*`*++a;;OSf=oC+0tVPq1=Bm8)`LEyI6bXN5s=U=57+*<I6V4!pBSo@2Xu9 z;Lp#V9`MIp4H3tdp0Ls<E0`VX)@~VTA;~%Zah8q2jLrJf22mWLve^90-FTH>%hgzS zZGfX8-tOUyl=K^|JKAAKHBHa}u!6Ao!Hp5_tQ^!)V<IKi$Z$8wA~3Aw9RA3JE32>6 z^VVqm+C$WoE-UqdS!9}6HdR#y_t&?5YzG(bii_W8WeePHpPy`gl@KiMVDEtd%Bl5e ztoof?eazPO<G(waj;|WM7VUd_{A$tpa9fB2b71*-Z+lkZ$@B4in=||ArUxCO4I@7n zjwl9&YR1jmc-fdFQVvSoB0BUWT?+wRlpP-E?+|#vh|IorL6JwPi+9k~iXIr0;;(^q z#a{V9tnX;NccYDB{fVsKGQF=Kpo{K9gGxxBSK55$nY&?6;%d9UC=r{qaAb_MASKKA z0I*?qPzE}&_o0G1a0BMpc;X((C=8Vnrog%&xhA({O*_#@5}cS^j@TJ-X!4*odO1jv zX>Hr+BTYMTx%{Iw69QOxa3zQvup({js=OBxxkKB4U{%Cxl8u0HQ$L*ds=A!(G2dv4 zM)#wg;!<qwdztkqzRkW87_}128&Q<#&lr^zKt?s8t?e=Q_3v(mU8GXVF&30IXBLZf zi+4i55Bo+Z$|pjoSkJcX0W&k{(}=PJwXI51K^5j%7lzo}7Lm%~cPGOmq*;al(^@o3 z5<Uhzt`EJcU9Q(*VPVV)M66i}zC)IFg=WZ0$5!ui4}Vkj<rrh(ah2}8vf=*H?KMMR z&ZIG0%2CtyBkxl4Ll%nkowwA95vj)-EHK9j88<kS@6E<N7YFiMvF6a1fROZl$puZ8 z&1@9Ha|rg(Wv_Wm`68*EH))zKNuNrUIPiSn`SgM$Y%{WWM$DYLW&6m4yqEQz&)m6K zegF@rXQ)b-+D&;Asa7z+jP5AO6UJQ8)F8qa%9J3bvZ_cdq0pR79fHMrKIJhkRVg?0 zftPG+1rWr&xGO6<<S_&nceE7-z8A}yRIRF|i@)JuYo|+DK%nj_j<SXNz_yH{>w%;Y z$(U)qJ6JC+oNCVli-V)p69<TL;@}lKcx~BcRf%_yV0|u1U8_mWZhhfr;xwTfxLm~X zMN$n8SBpw+vAl)ZOx$v%p33n}X!bh(jy$P*W0?Fp`drw+x3`^PwWFIs9*SrMV99y$ zWkQl%(G1evMGPU?#R1~VBIF;PUqG&BQp^IhUe68+O<s_14ne+eN^>t16Xo%N3|469 zzE)2&z^A952cKL<?x&iGVcgJxDN50ydk2V?0?+mwwqhTE?2z6OZp`w-3#N(JyQs^_ z5V7LTI|G<uh+&)o84LM}$+AzesTJl^NOGhlYlXQoBEZX`)XIxqPfK!t|IlKA7d}Xn z*Ib#JRu)!frOr|js)jQcw%r%e)@_YpOr2~UtWfBs;*3XEu{cMyr3Mb3H88H|Hm-yM zv_2SPw|;xlhyee2O#5P?26qi-YD|S3IDMsV&$*E_3uEH(#WQyp**(1uGmWy`r!ca< ztwYfPd+rBem;`jkHY2ryDed|rv3NDf{s_MmEnc<g(V4B)Cng)z_@alLtw#LLjoV=5 z<wMMjG8NjXW%Y(H&db)#2T3xS?%O0lOu`^D&UT(}U075tql}8CcQX{yO}8cPR=wS% z@yX<3Qo8zi33T%m5p6+M3;m10cmB70KWN*<8zwH{qO8j`9C;4k<gR-i3J;vwWa<xi z97L^%Eb=577OPzlROv8znyoT%=}SfCuTW2ANEdETX<t-+eUox%K@3?MZ7LMNCG+;~ z_lXTJk<R4?RMgHv0|3B36Pt^rk+YepimS7gy~Q6bfDdYV4(ZH5A5aUxaeKh3>y<V* zx}sbu&xM(a0ObY4=_jyqLv-7+f=*wgL!j(%);)Nrm-jfouFmYqa!uu0aAO>77V)?f zs$y1n#tErV=SSo^lmOMB-2$`>$~{qv78yamh(gsImu6YTQq?m=lhnj|%1Knj?X>xK zjg-=UjW3eqWTY5nq}B9{R^1?U(fd(N^EPRP&HzFK^SSvWSDz52O@<~l3)3%DJU2ft zFTRdc!`*b5G6naGOC8ga-3d||?IvJD7A>20#@CC;h&EYFnih0LUZmTJ<;;A`Urt@3 z;v)96Kb1NjPD*r&w_A*jbvGvE7AKqKQQ4%d>sDaA5Ba9GcGqcNP}!=pK>*UkmrnFW zX2DHL(<~H)+7C~`KGjHr#KkKr2|<E+w9rQ*q@j!>oX)V}9<SwPh?NhsSy;xLa4SY@ z(3C5$<vXWn^amOa_wLlsu^^tH8n;%z;Lj|~pAaFkBiau5?HQcQ*-8kq@)=l*#b!RH zWHH_5I!FkfGNw^BPGwv9@a|evcg6-V+;Fl(x8E8(Wqu@y?@BI(btVjI&C6b5PRFSF zFj3{}R3s!9&5P6_j%dX2`DF<;lPc^-#x}W1UtL7s2^a+r^@;pjxWW!5qlTa)jy$zf z>ox*_h{H~|p$}WJABYhDtbr=rXJt=8D*z`DRsM$+z#oNB#xJ_~-wOz!NlsE1SjUT} z*Gs9jzPG@VHO63Olb<}AJ)VO?i)$>ue2aLs<Z|5Hp*zl)9kDdeqUEC0PwwcmQO$}< z!!*lsbK-MhC7hu>!CKf%ttFeKCC9i+Bsh90EHH!Dp8ye38$BdmYQ6v3t=8y8g`QFk zT9WMGTiUka1`Un4i776OX3ifEu^Ni{Xd}#t$LlCs{pgLrp+>{PTJpGURg$MSJ>_Ym z7Br!9@Xq8T#?BbB8X_B?EhtYF#x5@=R+P@yv$pA#=*7Uo@`L$dPD%m{ehfjIh{^2m zEo*RVu;8HVHqV1sie4m|S$CcCQNqtz=3PfGcau>f3)3hqom_~gveJ5w6kPX6$G?Xy zKbyK|0aJr$z(=HdJJlH#C-x&Q9WgK7GEirLj{GZ^ars4d?}3>IzBBheUrliFY~qpU zYLb)L*tI$j&Bz{yhKKP}s@3Nbi-KkJScrGUDvrx$y)=9A3>*s6l$5c&;dzeiI1(+g z<J=KoUm(h-r8V&HOm*_(I_Z}Za`OXaMMB+H=OpY=Zu7gIsuA%xJ}~I4iJSOgTefgc z!r)1Kh}sOsL&`hZGKkK3d1GRSFY=^^>LlHdYLmXd_BketAI2p`rfkofvTvo!uUH3x zKdh50<*i)ylH!$5UX;c{1oGZR%HER=C-U3Wk0NyBh+DTW26K>wj<ae+eFjhQohKxg zGRXRUdiU{BuL*hsSLEv-`Sr0XDp+7EmZCoaw^|wqFiht{_k;i*_*NQqN<=mFFsiL0 z2nv$+`u_O!DXQw2tODlTzz!;`T@PB$$QHJl8TF%pPs4V0p|XM1Oy));1I|=Fy_2LX z2{t56jz}2X-`GZ-GI!|c)hjdA8r$hw%vVcv&uZPB5hP_@uo~jrxl;K<DsLi|4*6_X zIhx9`7gjw`+0lg?n6NF=uChw)wqb^xkW&w+C=+9(m7}@oi}|9$@8i;xw%wAq?|&~W zj;~47cY!>J9s>ZN`ZJ_Df?}zwnX`(StLx98%Jl4-h0)l`{<|uR&7vWSPh(vF#Uv!0 z7Hd#U>D*Mm^I`={Qe2B<VvOk~MPRrZN>f}chOn_R^#k4m2@ae2cjUpP+=P37`olZb zU|@V#rVG_ktJm?Eg&*>bttgjp1SH$7gy~#}3_i)&S>y*}gzuXqbQP8gmFoht`bjxi z+0zBA=H4Mj&7)lOHhc_08A&IyM7XEfx}|#>HL@BfoQFBP2VykH;>RL>&>C~o)_4xc zyV*|_3_IoAC+yh`n&|gjz$UM%q~=46bZ=hIsyDMv0o=Hr5SdSLP-%R;B|W`#^@G#j zp!Cm5>x#uzOlOE^!qX%5@-P>;d3Hs|&k;w21*0b&i&#C_5mf|v;Ehs+4Bt3TQb*P) zVN$T@4#2m`Gx=kU#SJ-)vA7k{+T^9n#!bohudm8JY<QL10U(yEkB=TJc$VjlZ?N?8 zSCcX#9yfa*-_%{&pVdBW^KzG$<aQS@PnZ9AM@ri!K}6k#v?92k#obSJ1ZdE@UE;LH zYr<wpUk|zfns6|=^L*%&xpe2=1geZ(-N0V>SjU@f^@@Tiy#k`V_{~XEJV5ZbE5=VX zeK=Ym7Px>SCMrmBGj%XgbarrbVKQ-WHv8EmBF_7-(gqqiKxCYfLLf6RcvbEmx!_pQ zF#Ri(=9C#zORp&#?rPelJ^Q5af_<c)LjWSn?V5?#*u$GKx%fUQ%oWsn)Iw<`V9+2$ zpETo?fLPUHqTf3{lhTcPYK(#sut3cD3$<?AZfQiOmJhFV!1`Ut&0xxv6LfS?BN0c0 zl+n3Doi{3{;<P=cymXZ=rLO!pncKS1=(neom%tyaiSyXv>cF%JTqnS|dKCR3%@CvC z!uWYHSXw>e?<K^lz%8m)e&s$&`K-l+bQF&oSW|hBljX{y`v}unmCdQAW>Dg;fuNY= zD4qgkEt6@-&aZ6dvd-}BL=nGU@`t3ohL)nqto;Em*nRF$mMr53=4Ov^=Q6yswN=6^ zVT}?$sHR=gxQ;JkuhaP$Khh=i8R6fpFTF2bbd)!DK^qrXfDznT9DE4ogT5hRfg56{ ztZPL*0UvBx66}<^1nn*QXZDteGBgYU@sSWD^q~Bek4BD;|E1$kBK~<~#C6$&6wQ!h zh)bl9qo^fA?2uRLO7(be=Bfcwt!#8(YZS#;MQ0>0&-3jHoMw9bZ$wX@<b3ih?UC*j z&r^nqHA@e~O5q|Irv;8^FPa|QFT^l<QEXsnj0>YB_xpYC4QIIBQs&7pCP|eGwRh|b zUp8Z2y@HR;r<NP`GL$-#FD^PkI*#{RHZg6d9~s9*j;!gwE%UM|DT*%7dirRUx%5dw zVbO%@)69~)-VY>Adn-TBWc0$2cU91#U3<-zLH2=1FTDg7Cih-jb0C4QNSQ3YB4)qU zWk!bS`7*P{ruFr#Ok#irYs+tBE~(5DsvE3WncoyS_JvKg+z@tXG}od5O{e0!LDPEd zq7Ce^_Om&^+K~z3u0khE=72EA@TLp=7+(&X!F#5SSfh<h$D;rvG6yayZxe#vV}Xvg zT_Ooma=%ReG@@3!IKdP4#gV-E`k0!eU9NAtZ(qmM>@a6|&I&IX`JA?4g~)lP%`EFP zVHJ9Bf@fHZXJais{-^Q;17`p&NPfR>?%#9u@AGeV(J9LO9pLY~eg19u^ZX9v5P#YG z^W5<7TPOZ%=mF{n{?8jJp5r_h(tjb<fI8~WWcBC9&lTEV#y>S%knu0Q_PObEsp*#~ zG}3>5_kR<fo&!FYLVf`@fi?*I>p}hr_)8dh4)|PI_yyR4@*MD&&hQ-Nd588FN)xDI z3;J8n`?b#jp09*|0mOouzCXwK`MUTy!t({vFN8My-#*A6WAYs3dHMJYWsB$!lxM}` zZ;Q$2pntDMenA2N`y>FsKWdZb=6_Efe>HzY{ulFqr4mJ%7a-RF0FXehc93^*{H%fj F{|~e33swLC diff --git a/vendor/shodhka/test_20220727/README.md b/vendor/shodhka/test_20220727/README.md index 619539f..beb34db 100644 --- a/vendor/shodhka/test_20220727/README.md +++ b/vendor/shodhka/test_20220727/README.md @@ -1,5 +1,10 @@ -a) Sample raw data: enclosed is a text file with dataset download links -b) file types for inputs and outputs at each step (particularly for FASTQC and TrimGalore (first two steps) operations): enclosed as a table below (also enclosed the corresponding excel file): -S.No. Analysis stage Tool used Input file type Code Output data type -1 Quality check FastQC fq / fastq ./fastqc *fastq.gz text, html QC reports -2 Quality trimming TrimGalore fq / fastq trim_galore --gzip --fastqc --max_n 2 --paired --length 50 SRR11862696_1.fastq.gz SRR11862696_2.fastq.gz fq; fastq +1. Sample raw data: enclosed is a text file with dataset download links. +2. File types for inputs and outputs at each step (particularly for FASTQC and +TrimGalore (first two steps) operations) + +Enclosed as a table below (also enclosed the corresponding excel file): + +S.No. Analysis stage Tool used Input file type Code Output data type 1 Quality check FastQC fq / fastq ./fastqc +*fastq.gz text, html QC reports 2 Quality trimming TrimGalore fq / fastq +trim_galore --gzip --fastqc --max_n 2 --paired --length 50 +SRR11862696_1.fastq.gz SRR11862696_2.fastq.gz fq; fastq diff --git a/vendor/shodhka/test_20220727/run.copr.sh b/vendor/shodhka/test_20220727/run.copr.sh new file mode 100755 index 0000000..c265cdf --- /dev/null +++ b/vendor/shodhka/test_20220727/run.copr.sh @@ -0,0 +1,11 @@ +#!/usr/bin/env bash + +FILES=$(cat ./data/SampleInputFileLinks.txt) +for file in $FILES; do + # --no-clobber, do not download if file already exists. + wget -nc $file +done + +fastqc *fastq.gz +trim_galore --gzip --fastqc --max_n 2 --paired --length 50 \ + SRR11862696_1.fastq.gz SRR11862696_2.fastq.gz -- GitLab