From 57b33a9281d79f78d35948c1bf1ce5112f1791cc Mon Sep 17 00:00:00 2001 From: seehagec01 <seehagec01@fu-berlin.de> Date: Fri, 18 Mar 2022 11:01:22 +0100 Subject: [PATCH] setup --- .DS_Store | Bin 0 -> 6148 bytes config/config.yaml | 12 +++++ workflow/.DS_Store | Bin 0 -> 8196 bytes .../2022-03-15T135851.892224.snakemake.log | 4 ++ .../2022-03-15T140112.429011.snakemake.log | 4 ++ .../2022-03-15T140222.370755.snakemake.log | 4 ++ .../2022-03-15T140225.807213.snakemake.log | 4 ++ .../2022-03-15T140318.383706.snakemake.log | 4 ++ .../2022-03-15T140349.569585.snakemake.log | 4 ++ .../2022-03-15T140610.870264.snakemake.log | 4 ++ .../2022-03-15T140703.847723.snakemake.log | 7 +++ .../2022-03-15T140938.788774.snakemake.log | 4 ++ .../2022-03-15T141038.010182.snakemake.log | 7 +++ .../2022-03-15T141257.023361.snakemake.log | 7 +++ .../2022-03-15T141415.922744.snakemake.log | 7 +++ .../2022-03-15T141432.576962.snakemake.log | 7 +++ .../2022-03-15T141436.384821.snakemake.log | 7 +++ .../2022-03-15T141447.281345.snakemake.log | 7 +++ .../2022-03-15T141505.214014.snakemake.log | 8 +++ .../2022-03-15T141509.059492.snakemake.log | 8 +++ .../2022-03-15T141559.573733.snakemake.log | 8 +++ .../2022-03-15T141603.058242.snakemake.log | 8 +++ .../2022-03-15T141609.906141.snakemake.log | 8 +++ .../2022-03-15T141632.425650.snakemake.log | 8 +++ .../2022-03-15T141842.449333.snakemake.log | 8 +++ .../2022-03-15T142135.708957.snakemake.log | 8 +++ .../2022-03-15T142139.848286.snakemake.log | 8 +++ .../2022-03-15T142146.756227.snakemake.log | 8 +++ .../2022-03-15T143128.835585.snakemake.log | 6 +++ .../2022-03-15T143316.866263.snakemake.log | 6 +++ workflow/Snakefile | 18 +++++++ workflow/envs/.DS_Store | Bin 0 -> 6148 bytes workflow/envs/yourenv.yaml | 33 ++++++++++++ workflow/rules/bowtie.smk | 32 ++++++++++++ workflow/rules/fastqc.smk | 25 +++++++++ workflow/rules/samtools.smk | 49 ++++++++++++++++++ workflow/rules/trimming.smk | 8 +++ 37 files changed, 350 insertions(+) create mode 100644 .DS_Store create mode 100644 config/config.yaml create mode 100644 workflow/.DS_Store create mode 100644 workflow/.snakemake/log/2022-03-15T135851.892224.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140112.429011.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140222.370755.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140225.807213.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140318.383706.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140349.569585.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140610.870264.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140703.847723.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T140938.788774.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141038.010182.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141257.023361.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141415.922744.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141432.576962.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141436.384821.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141447.281345.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141505.214014.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141509.059492.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141559.573733.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141603.058242.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141609.906141.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141632.425650.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T141842.449333.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T142135.708957.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T142139.848286.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T142146.756227.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T143128.835585.snakemake.log create mode 100644 workflow/.snakemake/log/2022-03-15T143316.866263.snakemake.log create mode 100644 workflow/Snakefile create mode 100644 workflow/envs/.DS_Store create mode 100644 workflow/envs/yourenv.yaml create mode 100644 workflow/rules/bowtie.smk create mode 100644 workflow/rules/fastqc.smk create mode 100644 workflow/rules/samtools.smk create mode 100644 workflow/rules/trimming.smk diff --git a/.DS_Store b/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..9f0666a725ddf766c61ec264e07125e59af3793d GIT binary patch literal 6148 zcmZQzU|@7AO)+F(5MW?n;9!8zEL;p&0Z1N%F(jFwB77k8z-DAJq$iaZ7bNB6Cqd;# zsnHM^4S~TM0-(Ih#*oaA&ydHE#(<iCcO(_$WEPhg7+hmyVrF4wW9MM!;O2-8&d4th zE=epYEp|#QiU#pQ^7C_&VC=-Cu*}r*cmWaT{JfIH%)Hbhkdolcl+>ieqL}c^yp;TM zr~J~qlwz=6s00Tm2WPy1M0K@^silsBp}A$PjzYDik%5kaiLqI2EhmSlvc7dte0EN5 zUVaxOI2josGy^Y`hEd%N3=AlKN-0jxNy^X90ck*y$VoR0PR`FQfaqkLjjk~_-^B%5 zm~n8$S=%rCc-RqBO$tFZ1sTZpfC^ny2bKjF<>ln(r9%o*1`dXDhJ1!1hHQp3h8%`` zhH|7rbtp#)hQE*_2161xa{3#<RTWymAV*NO_bp8>NCaV+m79-<Bz)>nB8u4nlrAvL zLW?YrnxTn7*#Q)&+(Xm(qpltefzc44VF-ZA2L))A<N&2Xr7$A{14s%)fV%*U3=AwV zXE1{M0bm6ntspfZtsoktm4Ok&0-FWa%D@QK$_Va;fb@ZDM+Qa)uyzJU2C#MpMh38U z23V!f2+_{K2(_6J+CyQ4XlG!AXlG!AXoop(lpYO%(GY-!05gOZ0M-Al3=FvX{}5H9 z<Y)+thQP240Y(;=U>7HFrHtKwpt=@RpC&-1LA5`qI!12@fTWoq1BwzLHV88^Kx%SE Z21rfL$N;IyM;ij5&>6*}Auuo@001W{*=+y- literal 0 HcmV?d00001 diff --git a/config/config.yaml b/config/config.yaml new file mode 100644 index 0000000..8442899 --- /dev/null +++ b/config/config.yaml @@ -0,0 +1,12 @@ +--- +index: "results/reference/index" + +samples: "resources/samples.tsv" + +bowtieparams: "-q" + +# schöner wäre sowas: +bowtie: + N: 0 # Sets the number of mismatches to allowed in a seed alignment during multiseed alignment. + L: 22 # Sets the length of the seed substrings to align during multiseed alignment. + extra: "--ignore-quals --end-to-end" # users can put here all other parameters or simply leave empty diff --git a/workflow/.DS_Store b/workflow/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..294de6bec7faff2e889ed62c1b20f8f1aa172492 GIT binary patch literal 8196 zcmZQzU|@7AO)+F(kYHe7;9!8z0^AH(0Z1N%F(jFwBJv>f7#IW?7_u2s8FCpC!8BBI zlo}0z(GVC7fzc2c4S~@R7*rv^2yqPuj(Q&=J4%j*z-S1J$PfUP4+@aBJ%a<3Zh+7r zDF#Lc25=XEk%55)7C?;PegFeV4x|-CgS3KZkX8mp5DRPuSSte~R4XI68v@cN05*z| z0j!;Y5o|L^9ITyz5o|L910zH`10&RCMraR(5u%-e5u%-e5o|ly$WdZ61V%#uEd)S) zcP<7!hGK?1XuloWf6qxb3{K9^Er6(3dBDKHfK^>?zKcszPJR+-AmNJP*XraChaGXN zO(9xsK?aijj2l4CU|~pQ$YUsDDE7?BPlnnF%I+Zh^!|eZNEriMT}p9sPEvk;4oDO( zi0U!v6%3%#3u-X3XFT-nHzz_o1J|3IkMICCc@#%87=Y~MWXNO4XDDGvWk_PkXUJ#B z#&G_61_lOX=VQ?U^9ZQ$!y=99C6KKQSX3c<j=xK&ITGSItSS-S#IF+7!(f|P8HyN6 z8FCm>(LKu8jpk7#l}Y8r1<)AXkyMbASzKaZaE+0PnT3^&or9f&n<F+jBfmVjB(bEl z*eS6n8pI39&(BGMu@jTRGE>Xr1w@?l^GXsk^HPgIN`f;}Qj-#kV!|`?Qu524@=Nnl ziotrJ5*(Zyobdt@)zv1ZmO2WC=9aZO3e}cI2098R#%8s(oE)Oc`qn}5**Up+`CVY& z!7CsJUI-sff_#VMBUqGy<dK9?ql#CBfq?-@7CDNhsi(YM^%0zzP*fnI2D=K>C;?Z0 zNcziyi}G^v^U}dpFarZSLoq`#LlHwJLjgkxMuh!Di!e0RFfW2qC7KkfH$h>5ZWXdu z4;^l;ho(j}bC5F}ZdIsW2HVET5DYKT(ik#9=@GTmU;+gJa<&6&8zn|VV8ny~GsLG7 zp#Hxr0|Tz{e~7A4ax?@+Ltt2j03(Y_u!|G4MS#tRpuRS!Kb-)T1XcK;?l>c;Uk=d+ zQUdDQgS+F5kV!?bYDNY~Po9wh(vxRoU;t?yxPbsrPep)%VYL1SN6#oRLPG!mWpq#* literal 0 HcmV?d00001 diff --git a/workflow/.snakemake/log/2022-03-15T135851.892224.snakemake.log b/workflow/.snakemake/log/2022-03-15T135851.892224.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T135851.892224.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140112.429011.snakemake.log b/workflow/.snakemake/log/2022-03-15T140112.429011.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140112.429011.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140222.370755.snakemake.log b/workflow/.snakemake/log/2022-03-15T140222.370755.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140222.370755.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140225.807213.snakemake.log b/workflow/.snakemake/log/2022-03-15T140225.807213.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140225.807213.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140318.383706.snakemake.log b/workflow/.snakemake/log/2022-03-15T140318.383706.snakemake.log new file mode 100644 index 0000000..b0300ae --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140318.383706.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 10, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140349.569585.snakemake.log b/workflow/.snakemake/log/2022-03-15T140349.569585.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140349.569585.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140610.870264.snakemake.log b/workflow/.snakemake/log/2022-03-15T140610.870264.snakemake.log new file mode 100644 index 0000000..5043d4d --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140610.870264.snakemake.log @@ -0,0 +1,4 @@ +IndentationError in line 6 of <tokenize>: +unindent does not match any outer indentation level (<tokenize>, line 6) + File "/Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/Snakefile", line 11, in <module> + File "/opt/homebrew/Cellar/python@3.10/3.10.2/Frameworks/Python.framework/Versions/3.10/lib/python3.10/tokenize.py", line 514, in _tokenize diff --git a/workflow/.snakemake/log/2022-03-15T140703.847723.snakemake.log b/workflow/.snakemake/log/2022-03-15T140703.847723.snakemake.log new file mode 100644 index 0000000..ebed290 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140703.847723.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024604_tiny.sam + wildcards: sample=ERR024604_tiny + affected files: + results/fastq/ERR024604_tiny.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T140938.788774.snakemake.log b/workflow/.snakemake/log/2022-03-15T140938.788774.snakemake.log new file mode 100644 index 0000000..af61bfe --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T140938.788774.snakemake.log @@ -0,0 +1,4 @@ +Building DAG of jobs... +WildcardError in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Wildcards in input files cannot be determined from output files: +'number' diff --git a/workflow/.snakemake/log/2022-03-15T141038.010182.snakemake.log b/workflow/.snakemake/log/2022-03-15T141038.010182.snakemake.log new file mode 100644 index 0000000..599925c --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141038.010182.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024608_tiny.sam + wildcards: sample=ERR024608_tiny + affected files: + results/fastq/ERR024608_tiny_1.fastq.gzresults/fastq/ERR024608_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141257.023361.snakemake.log b/workflow/.snakemake/log/2022-03-15T141257.023361.snakemake.log new file mode 100644 index 0000000..599925c --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141257.023361.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024608_tiny.sam + wildcards: sample=ERR024608_tiny + affected files: + results/fastq/ERR024608_tiny_1.fastq.gzresults/fastq/ERR024608_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141415.922744.snakemake.log b/workflow/.snakemake/log/2022-03-15T141415.922744.snakemake.log new file mode 100644 index 0000000..37ae37e --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141415.922744.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024604_tiny.sam + wildcards: sample=ERR024604_tiny + affected files: + results/fastq/ERR024604_tiny_1.fastq.gzresults/fastq/ERR024604_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141432.576962.snakemake.log b/workflow/.snakemake/log/2022-03-15T141432.576962.snakemake.log new file mode 100644 index 0000000..e12ba89 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141432.576962.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024606_tiny.sam + wildcards: sample=ERR024606_tiny + affected files: + results/fastq/ERR024606_tiny_1.fastq.gzresults/fastq/ERR024606_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141436.384821.snakemake.log b/workflow/.snakemake/log/2022-03-15T141436.384821.snakemake.log new file mode 100644 index 0000000..f39f7d9 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141436.384821.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024605_tiny.sam + wildcards: sample=ERR024605_tiny + affected files: + results/fastq/ERR024605_tiny_1.fastq.gzresults/fastq/ERR024605_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141447.281345.snakemake.log b/workflow/.snakemake/log/2022-03-15T141447.281345.snakemake.log new file mode 100644 index 0000000..599925c --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141447.281345.snakemake.log @@ -0,0 +1,7 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024608_tiny.sam + wildcards: sample=ERR024608_tiny + affected files: + results/fastq/ERR024608_tiny_1.fastq.gzresults/fastq/ERR024608_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141505.214014.snakemake.log b/workflow/.snakemake/log/2022-03-15T141505.214014.snakemake.log new file mode 100644 index 0000000..159fab4 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141505.214014.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024606_tiny.sam + wildcards: sample=ERR024606_tiny + affected files: + results/fastq/ERR024606_tiny_2.fastq.gz + results/fastq/ERR024606_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141509.059492.snakemake.log b/workflow/.snakemake/log/2022-03-15T141509.059492.snakemake.log new file mode 100644 index 0000000..0e148e9 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141509.059492.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024605_tiny.sam + wildcards: sample=ERR024605_tiny + affected files: + results/fastq/ERR024605_tiny_2.fastq.gz + results/fastq/ERR024605_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141559.573733.snakemake.log b/workflow/.snakemake/log/2022-03-15T141559.573733.snakemake.log new file mode 100644 index 0000000..6bbae34 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141559.573733.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024604_tiny.sam + wildcards: sample=ERR024604_tiny + affected files: + results/fastq/ERR024604_tiny_2.fastq.gz + results/fastq/ERR024604_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141603.058242.snakemake.log b/workflow/.snakemake/log/2022-03-15T141603.058242.snakemake.log new file mode 100644 index 0000000..4b3d34f --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141603.058242.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024609_tiny.sam + wildcards: sample=ERR024609_tiny + affected files: + results/fastq/ERR024609_tiny_2.fastq.gz + results/fastq/ERR024609_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141609.906141.snakemake.log b/workflow/.snakemake/log/2022-03-15T141609.906141.snakemake.log new file mode 100644 index 0000000..18abd49 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141609.906141.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024605_tiny.sam + wildcards: sample=ERR024605_tiny + affected files: + results/fastq/ERR024605_tiny_1.fastq.gz + results/fastq/ERR024605_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141632.425650.snakemake.log b/workflow/.snakemake/log/2022-03-15T141632.425650.snakemake.log new file mode 100644 index 0000000..18abd49 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141632.425650.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024605_tiny.sam + wildcards: sample=ERR024605_tiny + affected files: + results/fastq/ERR024605_tiny_1.fastq.gz + results/fastq/ERR024605_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T141842.449333.snakemake.log b/workflow/.snakemake/log/2022-03-15T141842.449333.snakemake.log new file mode 100644 index 0000000..3c0e492 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T141842.449333.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024609_tiny.sam + wildcards: sample=ERR024609_tiny + affected files: + results/fastq/ERR024609_tiny_1.fastq.gz + results/fastq/ERR024609_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T142135.708957.snakemake.log b/workflow/.snakemake/log/2022-03-15T142135.708957.snakemake.log new file mode 100644 index 0000000..6bbae34 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T142135.708957.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024604_tiny.sam + wildcards: sample=ERR024604_tiny + affected files: + results/fastq/ERR024604_tiny_2.fastq.gz + results/fastq/ERR024604_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T142139.848286.snakemake.log b/workflow/.snakemake/log/2022-03-15T142139.848286.snakemake.log new file mode 100644 index 0000000..f896786 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T142139.848286.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024606_tiny.sam + wildcards: sample=ERR024606_tiny + affected files: + results/fastq/ERR024606_tiny_1.fastq.gz + results/fastq/ERR024606_tiny_2.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T142146.756227.snakemake.log b/workflow/.snakemake/log/2022-03-15T142146.756227.snakemake.log new file mode 100644 index 0000000..159fab4 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T142146.756227.snakemake.log @@ -0,0 +1,8 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule map: + output: results/sam/ERR024606_tiny.sam + wildcards: sample=ERR024606_tiny + affected files: + results/fastq/ERR024606_tiny_2.fastq.gz + results/fastq/ERR024606_tiny_1.fastq.gz diff --git a/workflow/.snakemake/log/2022-03-15T143128.835585.snakemake.log b/workflow/.snakemake/log/2022-03-15T143128.835585.snakemake.log new file mode 100644 index 0000000..0e452c8 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T143128.835585.snakemake.log @@ -0,0 +1,6 @@ +Building DAG of jobs... +MissingInputException in line 3 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule refindex: + output: results/reference/index + affected files: + results/reference/reference.fa diff --git a/workflow/.snakemake/log/2022-03-15T143316.866263.snakemake.log b/workflow/.snakemake/log/2022-03-15T143316.866263.snakemake.log new file mode 100644 index 0000000..61d78e4 --- /dev/null +++ b/workflow/.snakemake/log/2022-03-15T143316.866263.snakemake.log @@ -0,0 +1,6 @@ +Building DAG of jobs... +MissingInputException in line 1 of /Users/charlotteseehagen/Documents/Uni/swp-workflows/workflow/rules/bowtie.smk: +Missing input files for rule refindex: + output: results/reference/index + affected files: + results/reference/reference.fa diff --git a/workflow/Snakefile b/workflow/Snakefile new file mode 100644 index 0000000..b2f07fd --- /dev/null +++ b/workflow/Snakefile @@ -0,0 +1,18 @@ +import pandas as pd +configfile: "config/config.yaml" + +samples = pd.read_table(config["samples"], index_col="sample") + + +rule all: + input: + expand("results/stats/{sample}.stats.txt", sample=samples.index), + expand("results/fastqc/{sample}_1_fastqc.html", sample=samples.index), + expand("results/fastqc/{sample}_1_fastqc.zip", sample=samples.index), + expand("results/fastqc/{sample}_2_fastqc.html", sample=samples.index), + expand("results/fastqc/{sample}_2_fastqc.zip", sample=samples.index) +include:"rules/fastqc.smk" + +include:"rules/bowtie.smk" + +include:"rules/samtools.smk" diff --git a/workflow/envs/.DS_Store b/workflow/envs/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..5008ddfcf53c02e82d7eee2e57c38e5672ef89f6 GIT binary patch literal 6148 zcmZQzU|@7AO)+F(5MW?n;9!8z45|!R0Z1N%F(jFgL>QrFAPJ2!M?+vV1V%$(Gz3ON zU^D~<VF)ln+{D2Rp-0Kl5Eu=C(GY-#0H}OW0QD6Z7#JL&bOVG2Nii@oFo3%Nj0_Ac zFio(203!nfNGnJUNGpg2X=PvpvA|}4wK6b5wK9UcAq)(R;4TS>25V<v1ltVagS9g- zf^BACV1#IAV1(Mt2<@RTf_gL{^C8+97{Ru~TsKOOhQMeDz(Rl-!Vmz}|E>%SxcdJP zRior+2#kinunYl47MEZbCs3t{!+W4QHvuXKVuPw;Mo^s$(F3lEVT}ML$bg~*R5_@+ b2Uo?6kTwK}57Iu`5P${HC_Nei0}uiLNUI8I literal 0 HcmV?d00001 diff --git a/workflow/envs/yourenv.yaml b/workflow/envs/yourenv.yaml new file mode 100644 index 0000000..fb2f959 --- /dev/null +++ b/workflow/envs/yourenv.yaml @@ -0,0 +1,33 @@ +name: yourenv.yaml +channels: + - bioconda + - defaults +dependencies: + - bowtie2=2.3.5.1=py37h2dec4b4_0 + - c-ares=1.18.1=hca72f7f_0 + - ca-certificates=2022.2.1=hecd8cb5_0 + - certifi=2021.10.8=py37hecd8cb5_2 + - curl=7.80.0=hca72f7f_0 + - krb5=1.19.2=hcd88c3b_0 + - libcurl=7.80.0=h6dfd666_0 + - libcxx=12.0.0=h2f01273_0 + - libedit=3.1.20210910=hca72f7f_0 + - libev=4.33=h9ed2024_1 + - libffi=3.3=hb1e8313_2 + - libnghttp2=1.46.0=ha29bfda_0 + - libssh2=1.9.0=ha12b0ac_1 + - ncurses=6.3=hca72f7f_2 + - openssl=1.1.1m=hca72f7f_0 + - perl=5.26.2=h4e221da_0 + - pip=21.2.2=py37hecd8cb5_0 + - python=3.7.11=h88f2d9e_0 + - readline=8.1.2=hca72f7f_1 + - samtools=1.4.1=0 + - setuptools=58.0.4=py37hecd8cb5_0 + - sqlite=3.37.2=h707629a_0 + - tbb=2021.5.0=haf03e11_0 + - tk=8.6.11=h7bc2e8c_0 + - wheel=0.37.1=pyhd3eb1b0_0 + - xz=5.2.5=h1de35cc_0 + - zlib=1.2.11=h4dc903c_4 +prefix: /Users/charlotteseehagen/opt/anaconda3/envs/yourenv.yaml diff --git a/workflow/rules/bowtie.smk b/workflow/rules/bowtie.smk new file mode 100644 index 0000000..b60c52e --- /dev/null +++ b/workflow/rules/bowtie.smk @@ -0,0 +1,32 @@ +rule refindex: + input: + "results/reference/reference.fa" + params: + prefix=config["index"] + output: + "results/reference/index.bt2" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "bowtie2-build {input} {params.prefix} > {output}" + + + +rule map: + input: + "results/reference/index.bt2", + r1 = lambda wildcards: samples.at[wildcards.sample,'fq1'] if wildcards.sample in samples.index else ' ', + r2 = lambda wildcards: samples.at[wildcards.sample,'fq2'] if wildcards.sample in samples.index else ' ' + params: + prefix=config["index"], + bowtieparams=config["bowtieparams"] + output: + "results/sam/{sample}.sam" + log: + "workflow/report/mapping/{sample}.log" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "bowtie2 {params.bowtieparams} -x {params.prefix} --threads={threads} -1 {input[1]} -2 {input[2]} > {output} 2> {log}" diff --git a/workflow/rules/fastqc.smk b/workflow/rules/fastqc.smk new file mode 100644 index 0000000..73f9dae --- /dev/null +++ b/workflow/rules/fastqc.smk @@ -0,0 +1,25 @@ +rule rawfastqc1: + input: + rf1 = lambda wildcards: samples.at[wildcards.sample,'fq1'] if wildcards.sample in samples.index else ' ' + output: + html="results/fastqc/{sample}_1_fastqc.html", + zip="results/fastqc/{sample}_1_fastqc.zip" + conda: + "../envs/yourenv.yaml" + log: + "workflow/report/fastqc/{sample}.log" + wrapper: + "v1.3.1/bio/fastqc" + +rule rawfastqc2: + input: + rf2 = lambda wildcards: samples.at[wildcards.sample,'fq2'] if wildcards.sample in samples.index else ' ' + output: + html="results/fastqc/{sample}_2_fastqc.html", + zip="results/fastqc/{sample}_2_fastqc.zip" + conda: + "../envs/yourenv.yaml" + log: + "workflow/report/fastqc/{sample}.log" + wrapper: + "v1.3.1/bio/fastqc" diff --git a/workflow/rules/samtools.smk b/workflow/rules/samtools.smk new file mode 100644 index 0000000..dc63db9 --- /dev/null +++ b/workflow/rules/samtools.smk @@ -0,0 +1,49 @@ +rule convert: + input: + "results/sam/{sample}.sam" + output: + "results/bam/{sample}.bam" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "samtools view -S -b --threads={threads} {input} > {output}" + + +rule sort: + input: + "results/bam/{sample}.bam" + output: + "results/bam_sorted/{sample}.sorted.bam" + log: + "workflow/report/sort/{sample}.log" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "samtools sort --threads={threads} {input} > {output} 2> {log}" + + +rule index: + input: + "results/bam_sorted/{sample}.sorted.bam" + output: + "results/bam_sorted/{sample}.sorted.bam.bai" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "samtools index -@ {threads} {input}" + + +rule stats: + input: + "results/bam_sorted/{sample}.sorted.bam", + "results/bam_sorted/{sample}.bam.bai" + output: + "results/stats/{sample}.stats.txt" + threads:4 + conda: + "../envs/yourenv.yaml" + shell: + "samtools idxstats --threads={threads} {input[0]} > {output}" diff --git a/workflow/rules/trimming.smk b/workflow/rules/trimming.smk new file mode 100644 index 0000000..9ee44de --- /dev/null +++ b/workflow/rules/trimming.smk @@ -0,0 +1,8 @@ +rule trimming: + input: + rt1 = lambda wildcards: samples.at[wildcards.sample,'fq1'] if wildcards.sample in samples.index else ' ', + rt2 = lambda wildcards: samples.at[wildcards.sample,'fq2'] if wildcards.sample in samples.index else ' ' + output: + "results/trimmed/{sample}.fq.gz" + shell: + "java -jar trimmomatic-0.39.jar PE {input[0]} {input[1]} {output} ILLUMINACLIP:TruSeq3-PE.fa:2:30:10:2:True LEADING:3 TRAILING:3 MINLEN:36" -- GitLab