From 89e23df4fdd51b1672d1f8c8582aa5d21daf2542 Mon Sep 17 00:00:00 2001
From: Viktoria Petrova <vipet103@hhu.de>
Date: Sat, 2 Nov 2024 14:46:43 +0100
Subject: [PATCH] add processing of rRNA data assay and protocol

---
 .../README.md                                    |   0
 .../dataset/.gitkeep                             |   0
 .../isa.assay.xlsx                               | Bin 0 -> 6912 bytes
 .../protocols/.gitkeep                           |   0
 ...rocessingOf16SrRNAGeneAmpliconDataProtocol.md |   7 +++++++
 5 files changed, 7 insertions(+)
 create mode 100644 assays/ProcessingOf16SrRNAGeneAmpliconData/README.md
 create mode 100644 assays/ProcessingOf16SrRNAGeneAmpliconData/dataset/.gitkeep
 create mode 100644 assays/ProcessingOf16SrRNAGeneAmpliconData/isa.assay.xlsx
 create mode 100644 assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/.gitkeep
 create mode 100644 assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/ProcessingOf16SrRNAGeneAmpliconDataProtocol.md

diff --git a/assays/ProcessingOf16SrRNAGeneAmpliconData/README.md b/assays/ProcessingOf16SrRNAGeneAmpliconData/README.md
new file mode 100644
index 0000000..e69de29
diff --git a/assays/ProcessingOf16SrRNAGeneAmpliconData/dataset/.gitkeep b/assays/ProcessingOf16SrRNAGeneAmpliconData/dataset/.gitkeep
new file mode 100644
index 0000000..e69de29
diff --git a/assays/ProcessingOf16SrRNAGeneAmpliconData/isa.assay.xlsx b/assays/ProcessingOf16SrRNAGeneAmpliconData/isa.assay.xlsx
new file mode 100644
index 0000000000000000000000000000000000000000..ef7ebe6dd6535e281c1c98d04ead35f96ca0d9e4
GIT binary patch
literal 6912
zcmai3by(DE)23OvVWqoUN~J+%>24%s>7`S^0G5s=M36>8kdW?>P`X1vMY_AwZ;^wZ
z*K^+Qeg4>Muid$4p6j03nfcwTs(_4wiGY9rKp3?%(~F*J#?V7VK-fk>Kp=vDY9Qla
z?+UheHP-ZU1iKh<dqV6A<CN@Mc=4e}V)y5{<gtx3weGiMmUolp?IR3(N^??9?Itu$
zc@VPZv(x6A5OE|5Z+WM--BPKH0F43V?j?n(2@zvV4zWSVYL1hea-!%n0NO8{NL@-~
z2xDjMMW?;80+P5EG9w2iKp=1gj_RVQevu}(0RD*(XI79i23Fir>x@5VN`%#8asxcI
z@Lb&wU2XH=?x-UvByz&ey+@x*oe{rL7)j698X6n~#ZUuodAO73SL7mM1&D&IIF=BD
z8a+}K2QXuA1stQ{yqh2Eh`{RRS&E+k#}cs_X{`{x<j}#XGM`8G%OvL$VqP07K!l)Q
zoGUAq8axojb>83VBslS%yL{ps(3gWQ=VS@97dz}Lk1~{zJRm@(2~R>l-te7?H8KV*
zTv|WJ(ddK3WtV*y-66m^{$X^P{GsyRfn5OIYWEv4!im$>60>_8&{Y%zcZq^o3e~?d
zf$%dEaPog0H26DXXRw_M&yCG>wszA%lPmD=6p#=QuzuNaUs)E$d{A!X#g^Rixj%pQ
z+FlNjkzGfd^_5vbyqVFSq9Wo=oB!rk2uu<?!Wuo&X?@AEd#zVAVl_hjkP@5o9XT;-
zcVAFnbN8jS6COJjS`Y&|zhf45(xSzMB7=NhXG4@8iChQTlj!4gw@NXk1dd4JE|qR;
zX}126m0<Vg$o>4HE!We|=ZgV(m3@+vwM=g>_=W`S><t`NqBl%4X)X27yI9Q?sX|_O
zjcg?c>MUlks}3v~X^+>Pi{+-u4P>NOCR-6`<SEZ~>o>VkP8ne=^@l4+SN*7=d=2$u
z@X*6}e9k|_B0S)OaKp$ySwn_1;%WDbvVR(2TpRowvjL1H+E>ihz?migyP1cBv#ptf
zgYDHX;f83NR$hGBtqaVOBYk&$dA4X5wikv5N5}!?m5O#CD`CjRkrss<B_IPmt*zj5
z;wQPa-XoD<6~z(s;&gU-{AH#04O_%M0#j#}_-&I0Vkl9V%#5E$Jl2FM1(v9seHo*b
zMA;mBcJ9mb<33cnAH2M$L^1UCPWMRX+ulbWtUBNm#^Eo>t5_-}Wtc;K+O)6PW}nr|
zOdX;b``-y)K9LV#ObzVeAy2t$j{4BZoCY>Nr=#%E<y*VUX__eRI|FRIFzxTI(r0~a
z65I75C&#2cb1}TebQ_&?ySL^APVe`A%Dd&YGq+0f--*V(Cg_S97b`H>_0KY`3RSBO
zfD_pQCmi?>+n*4=D?VSwt2rd`;y<50;($$4hzK*%A?3TPRe+KNASs9IK%xSq2bHmv
zX9sm63iCzjqj=FG6ymsNjmdjSOGOd5(iC~8e$AY8(aSaY=1m+O{Xu8%NJ7HFzU}&>
zVSe=h8T&50lh~oC9D<eyfMq2qa@!y`N{Vm6k%@`qvQf7yhN#Mbt44NcT)GR?tCI=L
zo%EXt>zyI*$F@x0*2Wv!5l?$$R<Q(=a+M`CTF;yGl}9$AkMmtr(-c*&qRHBUIX1%l
zW8TiK_18VJu7vEArJ42}CvNx&A1gZ-hUaf!J3S-vJ?qs=ZkJ=<lb<D{)DauX<nG`q
z*kXlM_k8U=;_h^~n=jjYSa?yCDvnWO%ekp0PhU}0xZY0YgwLf+!ssP-s8(U$1FkK4
zB-G+)SnQXzvOq#%p_gcTKs?ihyt&&Pc?PfrdT}QX62~rn@^;ukqvQwDbTLNZfvH{2
z=~i3b(21_@m?V2pwbUJYx+V+b&Gd?WI}qW)naQSh5brYx*e0dsp<3dS@l=Sa0xlIw
zdvZioQ7(b0qb{RfdDV|XmlikAYwXUAU??QsvpP$%H8Kejjgq`-JNQ}n_0CqA%XA&|
z+k$=}wL!Ge&B7SW@-%*iNXE<wZ=V8&FnrQXq!9r8m_FGiEr@^^OrLiqf-idfV2z@@
zrg%7|L8pfUc@_lbcn2F9KPHL18z3h4c3!TetSgO#PQGwt*w2fqwS9-?0o5wk8q43L
z6#QHX6@TznsxVFreJA8h=JN$U8yBCH$0=(^dikiLz7O!zGmc~{VgEJ@nKG|R-68B6
z&ymuYC`BM8@h1ru!xH^T^aBO$N~e?w=&QqLJ+zIKO<fW<Res%Ixg`QL9pK~e0el=1
zUstY+m8mn>T*KAb+TPOTXVu2_!aFT~z?LX<;hx({hBPaPM9Lp#MZvVt>;$TeVETbl
z>_1ucDGwis{Qmy(SBLcyG52y2t9J2$=yK*o;aE0HD|Q2gvZ#}8p}NL}aM1+vI6>eZ
z1EDda4nee~lnv`*#L-3yzNX;Y7tEFSiSFK86FBB|^_D7>d7CG-uOBkudY6nmYo?$y
zWrr`VS7a^RXKVYi4kpVO+reV3ms1?Q4PrcP(TN5`+Ce2#WFkJ6ZIrbCP_qkDE-TN6
zohp^N<xUS6WpY85*v;GdDYPLaHsM<C&nQa{&}-X9)Ax}yYLKRl`*{;UP&=H{9^rim
zVNDrJtVPqr*B%9(g5ie(39H(jU9Zu%X&FDv2dLnN;##il>vZjcqamTArK~}|^K@}D
zw5fEAkd8hc_Sj8{&+=pIopL-<gRIrqCz@|$zXcreZesL#T$ZJcRbZjt>05VK2W`_4
zzA-c<iR^c!=LSvG*t43^`=E5P+$89~wsTi2Fa-Ro>tE+FrcaP196m+cXs_2A_*l3$
z`}z8_`E2N^I7|r<|6upqEHXFPO-r{o?RFm)viAG9F~GnuO!`<}K#n~`jTksN%#DoZ
z+RBaWK4l8jHbK>1FU2EDZy)mw76V-}Oll@oS`V5!AtYrz-P-wdL``Gd_HJB7#)k4S
zHy}*k;v^J8F0wlTlbwtAav0zdRFsh;#vuR`*eBlR>{%Nx%H+EB9iM`hDuio<ADJ!J
zAfCww_+S<@X%>(g0mO?A;HEK<iBy)fl`9N|j2GZXcL>lE`wcY=1|NS0GP3t(?@~jH
z<wDJybI+SqEPE8PKF?$&p9d#yvkFHNKoWWTVJX<#c>*}00RiY-!^#plZX5X(#F?d%
zLM-Dd5-v40&5r7zh2vvKwq=nb4O^ZA9sY}?>PHPaYoqa}>Il2Oy4HGc${y_`-w{IZ
zdQJZI>ys*d?d>}kqc}cON|(ewZcq=Q?Tf~$Qd8VG!LK;=Q`YXa`A<Ed#gOl7?saP;
zBtDp!tRc)4R#Syq4ed6sU<7Zb^gV~&P7k^$8>RJXmb>N|^oVWg?wZx(Js+u&i|K%s
zu~E~}I8tZM!-yUSg(Cy%*+LVZo7R~fZLs^WJX4;O7YnWA?E+cKG=2uk9|K#K%-IbV
zxdv<&X?cw6MZC|?*LSuoRZ^41F5SeBa=r+Ke)Ostm+;-|$1^5>_TzAFEq8i#hd%1r
zLAOrv<?)`<YPR%Ron>*Vg!jqC__K?1O=Jfb*MuNExnQUhdK%C}4}dkI_#E$~4up*)
zON>E`ppLxWDT(+kkuJa0?Y&LQ86`gy*ONh9y_y<DG+q|Do+<#-@fF{ssbO96RHxy|
zLffFO#GR<U>N)_`+T!6D<(IHr{9W1HA*}b(E@^&MgTRNn<ej&LKIk$WKF4n_s%u+P
zd><`9jsM0!c#IL*ne{+=iV>x$#}(znXeh*ei-PKb+iKmh?){cZNzGhBjrMS1RZg|H
z;Be{J4>xIVEz42&R2Ksc<+k^M8W#J3x`31(>NGZ22bsXZI^S1)(j=WsiOaBi!6l-l
z-OP`kx8%j&4)GH`%t??8rhl9U;=;(;gk|A9l~l{9+alteh8RryV`t&P=0QDf21vKv
zB>I*CrYXBZcrVu{7iB4^QalR+4skycr=-(;{Me9mS2T%VY{dZ4{3WEItd}e6qs>s%
z`{(>@dA0(POwt$=$f6dgKJJ#bA(nxe_&fBy9?Ui!``_b+bB4rLRpK<|Jxi?*7!PHG
z`?B36B;|FPd^4iPZ$*7`i+a&B=-u(%BmPC(Q~N1w{Pxr5w`f^;T~|nD%^KuNQ`Adz
zIfT`PH@a}f^c#p`mJ8ea^(W?@zAjyQLn2CMyh@xMcYu@&IHKXSt!0fo<V$9JrPT}8
z+Iv=D6MDD{=5o>NHXP$mD~Q*7$)kPArIOFY>9cT~K90KMR{K4AE+3Tj3sV}jVP*Dm
zpH=~!^gC(FA0qC^PoY`vV$u8iBPf}^cD~!H+oKf)<pU$hvy`cN=s#(n;ij;7v#>jx
z%?zNeArBg|<->)(?s;H)FgjJ2eOfL|>V;&Vzkkl?9Gl0OPfmESdLkFM5oR_x^4=<L
zx~-+l3l*0InaQEmh~+WL3>ux7;(1&rPrdg{DmQ;l?Ruz%m(o&;Xd$cvnj}w87Klhm
zz1B*$zGk7ZwHg}#pkas42Lf3{BhM3?Lpd}YMHLi(UD-o$K8(`qh<Pd-lZQ|BkZbsr
zi%gS>MWQoZogB(7PT#mf2}VK}{}_BTu`M+6!s?eCZfAQ;<K+?(-Fj=vAKwrhf<JWR
zWA*bhP3F=7l<#t)4WWP7ZWGDkYYJ;twQooUI?4qY>buB!a#!nU8!G7R6}~mBEU0A7
z97gC>iSyy_|8DIKVyTLZTRF|=Ou@kWbP*=vHqBigFMx#$dtyp@<{9J@sioE5HM&@9
z(fV|cZD$5uI#ORor7%BN+tuCBL<*Kvq-|0qpCK%<Eub5v&!MA}(-2_*arZ=to`%{8
z=BS(Vd{WLhKO{Yh)?=1?NH(#cNzTW@wU@C`NmV@igsE=kP+oboL;<JDh^xY=N`JEk
zTsM^`iu9&~ma}f+i|?^zTHoTU!<FNY?Y`Bl6~)J#<+}Rl26>K8oQ#WzjlWQ!aPGa=
zUJ-uRt6VrzP<h6bJ7pdB`ca|A>RA1gs_BC-56XUY2t;bUA1->LTsY1;+Lfx~Y~wE7
zG{`xcBA>l6G8K_J{8XSyu)t@hj@O}UZL;ZR#$69D)O*h#xx?3IWcUEX`D+Pr^|Ay1
z+&;47jNm&nap2Yw2j{c~G7e|Ra~tbW&AcRb!C3dT=b(a9<XgkhN@rX5&<F|LCUXwE
zJ{3o$?VaAPS;>;*=@Bq|M~to`{y>qWcHZXIY;n?;q{kz=`SR@LW^Cf`(WcF5Vm?x%
zcu(H8Ai&p*oo%Q%h=JvNz70y^FuIM(@KPv7fB7|)wN0zlL^VhqHgNQqo=wM-mJ_@q
zfe-3+G4O`Q3s(4aqgDl_LZdn3kM3pTe8qH}M7^z_&K<1eSumhb94hw+_;tDK5n|kO
z{w%8ZhMN>=04Wj1dj|$of}K{=89jAtFoou_w%%vo^m{?wmf213zTn((>gbA*#)810
z>OGw(uIx1;>16Ecly@_PThOGOKZia#=L1MdJRE%7!bRd^TTRrdn&CkH-I-3gNLm!2
zheTnYsCLJ70O)`#n4sn;h^Cl!6t$j`5kwo_$Gnd-^3_J8MJxGmjujkY@)C*>xOG@m
zQOj&Up#OQ9lkLt|>-$g{YRhm$6D;Po*t+8Bd@Oezy3sDf$us_T$DOaMQFK7^R>a$`
zls}S%-cLu|H*)Kg$T*WG+m8+X0?IiK^QJJ9PKR_u7gq5CU+B5Vjz1l#{p75N3S@d`
z#j(C9kTA=3*(3k0Ydh|s!?>KPEa&(`iY9&?c|jRo#D>8LdFpJM$GfPo10(7uF3$vy
zEXFx^Ne68<?w3uCK1ty@A85L8JG7bJvG^2(1_LwDc87;i^-3t|hxXs~zj*qi`LO2b
zKJY9pv-xP(R$|+NFU5QB`0nm5D`0%b&W&tgF!5+PqA5Vd&xD_bi|du5V>|bTL!Xui
z<MJh#VBV9^{Is!b`ldkteF-ync&zH|;P~fbVCO<BH~_v(Gs7Ru@!@s+%gof#@oJGy
ziIH-c;>Ct;osk4?MkL#_21;u4Wl=oQEkOWH%{6zra%#q-L<`1ToOa^Q-d$6!6N|y?
zPh-oUl35C+CYt!pQDPXEDd`{$xo9Mes&mjuyDx>^h(;!=JsZque}G;AqBAoK)0{_9
zd1;k6Coj*><t`Z}dgwJ2FoL+mzX7%)x83GW7{?XsUMsDS_B7cS9Mf^aB+hNq>i<EZ
zkA8c5aCj5wlB#WN<~oM3ls1AlmL-`nGrRU7UBg*i^Nv;6qM)Ams(PnaUL_i3k;{Ag
zW&-w;G1VhLYoCw_k@e_a{=-%}67y$Eg+^hsWcauuFPG``wmFq6HTZ1ELSmodu0Zu=
znVE7IS(m=mRHp4a3z$1u#}Ubmy$Zh9jl1%&>_yuT+DCmM57GD@m!n9$07P!#_tTtl
zJf*4yh;OMXuOf=BJ8dhk)*bNd13hMNf&B`NcKHx2jJ0#_VFpDUw>0Zmit{znbLzFS
zr3(|0klf*kwT0fybKUqkretsVMx*LW<eS7^cb?q12Es@1jLpHj55eCv_SnH0{4-_h
z-B(&*{SgQKv_Fv_J28~Df+Uw-i(Tv8H$!g>?hwd?g3M)OpFaY7?l*ULi%(~cm7?0<
zZR9afAt__3EF(gD1uS0|R@KX%9NSE%;rCMigP*|n4*sU@YEVt(wpj&Y7@^_!h&Y8B
zJs4Fch|SFhoy3KxST*&FjRD{O0O<&Cqb2HqHSyPBOc+LBcx7P5Evilvwqq-6+{$%q
zlw4J5R7|P}7Ctds0=or!Qr8}6Y0PI}HJe!Uo73fa)`GPs>MSWEM>NAx2Ya@{Hmq88
z?6{2mC@M9mfs>04HpQ-m{7<57z2bDGzhwsvJlxzqz@a?b2l#L{J8|Hg-aDArYDs&H
zr&L(znA#w{kqwm2fDCI`&P#Pt7G2a-5w^*=Y##8u#Hrh`L?Ad$$+|#O>G9q@F4v3p
zAy=|Ar3@N$C1SDWSF!B0oZ8d6n0QZ4eNr{oX_BzDYP|Tz7_i`yd1?qxhATW7c-Ld#
z?_yL$jFJjm@C)2J4`n?n<nl)xodf}3?oyP`Id;`O!s2<_S9E`f**}cNC*yWnZ;LX%
zr&p*l7R>Nq=$lq)!jgKrM&qEpPG{A4?nEJRT(h7_eXIPToU@T}fw-@zU4sOm&qK4*
zS3aYMU){T0(uHPV2ekGE+GhU+OiV8=<K1Si<es?H-Q(xJtH?U{4A=;%XhAQ&8^)bN
zM}Whqt>R5(m8o|?lMMA-Zc+520G5nC$bA|hZ>m)@afim#wt7v&Ni5py3>{Jtn(C9Z
z7=B86k~>Y`A3FQRxxuF5!_nRdYQQ$O`&+XtUdfe`L5w7MXQerb9UWTtna1J3l)C$k
zFujXCLLN1N&(fAd9PeH)pXYSHt7pyn9)mHbF!E4UEGX!U8kMgBUr~~U2$8*J7KZq9
z!08SVV<e@ZH8lnno8WYK(xMFlm<aSjt-zd@VI`-7$KfMIY~LxCssbVsF~WaW$>G`f
z+xZvG{I`RDcFZer_xfBl#ZY*LZv@Hz4Em?odxJtiDEfu@sYw2R!LBsX>vI*X8D2_1
z71EnX|GeFmMtXg&05jKsf4|_Ln&}M?{@(&TEIiIN?C(YUKks`bEnc6i@N94y2JYuS
zgvOhzUw5oOrN$dH0)o~*u)l@J-;7;*`BV1!?FA40=MDZL0{!;zzbJeU`03$BrTEY5
z|EW{_4m|#M*l*S1ciey96@NR3gZB(LcP_s+$KTNZb!9=qzYXi(u<M9_PW9gr4gU`N
zYsUYH{&T|oM&rWuwqF~<&Aj;&{%2484NoHZRVp`fy{ZE0&)*t8eEawauSiC+EA#&Y
D$2oEE

literal 0
HcmV?d00001

diff --git a/assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/.gitkeep b/assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/.gitkeep
new file mode 100644
index 0000000..e69de29
diff --git a/assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/ProcessingOf16SrRNAGeneAmpliconDataProtocol.md b/assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/ProcessingOf16SrRNAGeneAmpliconDataProtocol.md
new file mode 100644
index 0000000..534e2fd
--- /dev/null
+++ b/assays/ProcessingOf16SrRNAGeneAmpliconData/protocols/ProcessingOf16SrRNAGeneAmpliconDataProtocol.md
@@ -0,0 +1,7 @@
+## Processing of 16S rRNA gene amplicon data
+
+Amplicon sequencing data from *Lj* (Thiergart, T. et al., 2019) and *At* (Duran, P. et al., 2018) roots of plants grown in CAS soil in the greenhouse, along with unplanted controls, were demultiplexed according to their barcode sequences using the QIIME (Caporaso, J. G. et al., 2010) pipeline. DADA2 (Callahan, B. J. et al., 2016) was used to process the raw sequencing reads of each sample. Unique amplicon sequence variants (ASVs) were inferred from error-corrected reads, followed by chimera filtering, also using the DADA2 pipeline. ASVs were aligned to the SILVA database (Quast, C. et al., 2013) for taxonomic assignment using the naïve Bayesian classifier implemented in DADA2. Raw reads were mapped to the inferred ASVs to generate a relative abundance table, which was subsequently used for analyses of diversity and differential abundance using the R package vegan (Oksanen, J. et al., 2007).
+
+Amplicon sequencing reads from the *Lotus* and *Arabidopsis* (Bai, Y. et al., 2015) IRLs and from their corresponding culture-independent root community profiling were quality-filtered and demultiplexed according to their two-barcode (well and plate) identifiers using custom scripts and a combination of tools included in the QIIME (Caporaso, J. G. et al., 2010) and USEARCH (Edgar, R. C., 2010) pipelines. Sequences were clustered into operational taxonomic units (OTUs) at 97% sequence identity using the UPARSE algorithm, followed by identification of chimeras using UCHIME (Edgar, R. C. et al., 2011). Samples (wells) with fewer than 100 good-quality reads were removed from the data set, as were OTUs not found in a well with at least ten reads. A purity threshold of 90% was chosen for identification of recoverable OTUs. We identified *Lj*-IRL samples matching OTUs found in the culture-independent root samples and selected a set of 294 representative strains maximizing taxonomic coverage for subsequent validation and WGS, forming the basis of the core *Lj*-SPHERE collection.
+
+Sequencing data from SynCom experiments (including FlowPot and millifluidics experiments) were preprocessed similarly to the natural community 16S rRNA data. Quality-filtered, merged paired-end reads were then aligned to a reference set of sequences extracted from the whole-genome assemblies of every strain included in a given gnotobiotic experiment, using USEARCH (uparse_ref command) (Edgar, R. C., 2013). Only sequences with a perfect match to the reference database were retained. We checked that the fraction of unmapped reads did not significantly differ between compartments, experiments or host species. We generated a count table that was used for downstream analyses of diversity with the R package vegan (Oksanen, J. et al., 2007). We visualized amplicon data from all experimental systems using the ggplot2 R package (Wickham, H., 2016).
\ No newline at end of file
-- 
GitLab