Skip to content
Snippets Groups Projects
Commit 8b3024b7 authored by james94
Browse files

build hifi changes

parent 25d6b9be
No related branches found
No related tags found
No related merge requests found
...@@ -3,12 +3,12 @@ localrules: symlinkUnzippedHifi, symlinkfornotSmartTrimmed, multiqc_hifi ...@@ -3,12 +3,12 @@ localrules: symlinkUnzippedHifi, symlinkfornotSmartTrimmed, multiqc_hifi
def fq_to_trimSMRTbell(wildcards): # def fq_to_trimSMRTbell(wildcards):
return trimSMRTbell.loc[(wildcards.sample, wildcards.readCounter), "hifi_reads"] # return trimSMRTbell.loc[(wildcards.sample, wildcards.readCounter), "hifi_reads"]
#
#
def fq_to_notTrimSMRTbell(wildcards): # def fq_to_notTrimSMRTbell(wildcards):
return notrimSMRTbell.loc[(wildcards.sample, wildcards.readCounter), "hifi_reads"] # return notrimSMRTbell.loc[(wildcards.sample, wildcards.readCounter), "hifi_reads"]
def hifi_gzipped(wildcards): def hifi_gzipped(wildcards):
...@@ -24,7 +24,7 @@ rule unzipHifi: ...@@ -24,7 +24,7 @@ rule unzipHifi:
input: input:
fastq=hifi_gzipped, fastq=hifi_gzipped,
output: output:
temp(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/01_unzipFastqs/{readCounter}.{smrtornot}.fastq")), os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/temp_unzipFastqs/{readCounter}.{smrtornot}.fastq"),
log: log:
os.path.join(config['Results'], "0_buildDatabases/{sample}/logs/hifiReads/{readCounter}.{smrtornot}_pigzUnzip.log") os.path.join(config['Results'], "0_buildDatabases/{sample}/logs/hifiReads/{readCounter}.{smrtornot}_pigzUnzip.log")
conda: conda:
...@@ -43,7 +43,7 @@ rule symlinkUnzippedHifi: ...@@ -43,7 +43,7 @@ rule symlinkUnzippedHifi:
input: input:
fastq=hifi_notgzipped, fastq=hifi_notgzipped,
output: output:
temp(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/01_unzipFastqs/{readCounter}.{smrtornot}.fastq")), os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/temp_unzipFastqs/{readCounter}.{smrtornot}.fastq"),
log: log:
os.path.join(config['Results'], "0_buildDatabases/{sample}/logs/hifiReads/{readCounter}.{smrtornot}_pigzUnzip.log") os.path.join(config['Results'], "0_buildDatabases/{sample}/logs/hifiReads/{readCounter}.{smrtornot}_pigzUnzip.log")
container: container:
...@@ -56,9 +56,9 @@ rule symlinkUnzippedHifi: ...@@ -56,9 +56,9 @@ rule symlinkUnzippedHifi:
rule trimSMRTbell: rule trimSMRTbell:
input: input:
os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/01_unzipFastqs/{readCounter}.smrtTrimmed.fastq"), os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/temp_unzipFastqs/{readCounter}.smrtTrimmed.fastq"),
output: output:
outputFile=temp(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/02_trimReads/{readCounter}.smrtTrimmed.fastq")) outputFile=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_trimReads/{readCounter}.smrtTrimmed.fastq")
threads: threads:
resource['trimSMRTbell']['threads'] resource['trimSMRTbell']['threads']
resources: resources:
...@@ -77,9 +77,9 @@ rule trimSMRTbell: ...@@ -77,9 +77,9 @@ rule trimSMRTbell:
rule symlinkfornotSmartTrimmed: rule symlinkfornotSmartTrimmed:
input: input:
os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/01_unzipFastqs/{readCounter}.notsmrtTrimmed.fastq"), os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/temp_unzipFastqs/{readCounter}.notsmrtTrimmed.fastq"),
output: output:
outputFile=temp(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/02_trimReads/{readCounter}.notsmrtTrimmed.fastq")) outputFile=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_trimReads/{readCounter}.notsmrtTrimmed.fastq")
container: container:
None None
shell: shell:
...@@ -89,11 +89,11 @@ rule symlinkfornotSmartTrimmed: ...@@ -89,11 +89,11 @@ rule symlinkfornotSmartTrimmed:
rule fastqc_hifi: rule fastqc_hifi:
input: input:
os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/02_trimReads/{readCounter}.{smrtornot}.fastq") os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_trimReads/{readCounter}.{smrtornot}.fastq")
params: params:
folder2out=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/05_multiqc/") folder2out=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/fastqc")
output: output:
os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/05_multiqc/{readCounter}.{smrtornot}_fastqc.html") os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/fastqc/{readCounter}.{smrtornot}_fastqc.html")
threads: threads:
resource['trimSMRTbell']['threads'] resource['trimSMRTbell']['threads']
resources: resources:
...@@ -105,29 +105,29 @@ rule fastqc_hifi: ...@@ -105,29 +105,29 @@ rule fastqc_hifi:
os.path.join(workflow.basedir, "envs/pigz.yaml") os.path.join(workflow.basedir, "envs/pigz.yaml")
shell: shell:
""" """
mkdir {params.folder2out}
(fastqc {input} -o {params.folder2out} -t {threads}) &> {log} (fastqc {input} -o {params.folder2out} -t {threads}) &> {log}
""" """
rule multiqc_hifi: rule multiqc_hifi:
input: input:
lambda wildcards: expand(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/05_multiqc/{readCounter}.{smrtornot}_fastqc.html"), sample=wildcards.sample, readCounter=dictReadCounter[wildcards.sample], smrtornot=dictSamples[wildcards.sample][1]) lambda wildcards: expand(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/fastqc/{readCounter}.{smrtornot}_fastqc.html"), sample=wildcards.sample, readCounter=dictReadCounter[wildcards.sample], smrtornot=dictSamples[wildcards.sample][1])
params: params:
folder2qc=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/05_multiqc/"), folder2qc=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/fastqc/"),
filename="{sample}.{smrtornot}.multiqcReport.html" folder2OUT=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/multiqc/"),
filename="{sample}.multiqcReport.html"
output: output:
os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/05_multiqc/{sample}.{smrtornot}.multiqcReport.html") os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/QC/multiqc/{sample}.multiqcReport.html")
log: log:
os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{sample}.{smrtornot}.multiqc.log") os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{sample}.multiqc.log")
conda: conda:
os.path.join(workflow.basedir, "envs/pigz.yaml") os.path.join(workflow.basedir, "envs/pigz.yaml")
shell: shell:
"(multiqc {params.folder2qc} -o {params.folder2qc} -n {params.filename}) &> {log}" "(multiqc {params.folder2qc} -o {params.folder2OUT} -n {params.filename}) &> {log}"
rule meryl_hifi_count: rule meryl_hifi_count:
input: input:
reads=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/02_trimReads/{readCounter}.{smrtornot}.fastq") reads=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_trimReads/{readCounter}.{smrtornot}.fastq")
params: params:
kmer = "{kmer}" kmer = "{kmer}"
threads: threads:
...@@ -136,7 +136,7 @@ rule meryl_hifi_count: ...@@ -136,7 +136,7 @@ rule meryl_hifi_count:
mem_mb=resource['meryl_hifi_count']['mem_mb'], mem_mb=resource['meryl_hifi_count']['mem_mb'],
time=resource['meryl_hifi_count']['time'], time=resource['meryl_hifi_count']['time'],
output: output:
temp(directory(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/03_merylDb/" + "{readCounter}" + "_hifi_dB.{smrtornot}.{kmer}.meryl"))), temp(directory(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/merylDb/" + "{readCounter}" + "_hifi_dB.{smrtornot}.{kmer}.meryl"))),
log: log:
os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{readCounter}_hifi_{kmer}.{smrtornot}.log") os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{readCounter}_hifi_{kmer}.{smrtornot}.log")
priority: priority:
...@@ -150,18 +150,20 @@ rule meryl_hifi_count: ...@@ -150,18 +150,20 @@ rule meryl_hifi_count:
rule meryl_hifi_build: rule meryl_hifi_build:
input: input:
lambda wildcards: expand(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/03_merylDb/{readCounter}_hifi_dB.{smrtornot}.{kmer}.meryl/"), sample=wildcards.sample, readCounter=dictReadCounter[wildcards.sample], kmer=dictSamples[wildcards.sample][0], smrtornot=dictSamples[wildcards.sample][1]) lambda wildcards: expand(os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/merylDb/{readCounter}_hifi_dB.{smrtornot}.{kmer}.meryl/"), sample=wildcards.sample, readCounter=dictReadCounter[wildcards.sample], kmer=dictSamples[wildcards.sample][0], smrtornot=dictSamples[wildcards.sample][1])
params: params:
kmer = "{kmer}" kmer = "{kmer}",
removeReadDIR_trimmed=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_trimReads/"),
removeReadDIR_unzipped=os.path.join(config['Results'],"0_buildDatabases/{sample}/hifiReads/temp_unzipFastqs/")
threads: threads:
resource['meryl_hifi_build']['threads'] resource['meryl_hifi_build']['threads']
resources: resources:
mem_mb=resource['meryl_hifi_build']['mem_mb'], mem_mb=resource['meryl_hifi_build']['mem_mb'],
time=resource['meryl_hifi_build']['time'], time=resource['meryl_hifi_build']['time'],
output: output:
directory(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/03_merylDb/complete_hifi_{sample}_dB.{smrtornot}.{kmer}.meryl")), directory(os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/merylDb/complete_hifi.{sample}.{kmer}.meryl")),
log: log:
os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{sample}_hifi_{smrtornot}.{kmer}.log") os.path.join(config['Results'], "0_buildDatabases/{sample}/hifiReads/logs/{sample}.meryl_hifi.{kmer}.log")
priority: priority:
10 10
conda: conda:
...@@ -169,4 +171,6 @@ rule meryl_hifi_build: ...@@ -169,4 +171,6 @@ rule meryl_hifi_build:
shell: shell:
""" """
(meryl union-sum {input} output {output}) &> {log} (meryl union-sum {input} output {output}) &> {log}
rm -r {params.removeReadDIR_trimmed}
rm -r {params.removeReadDIR_unzipped}
""" """
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment