From 92a8ed7ec81eb15598c2fd0cff2cc74d38340c95 Mon Sep 17 00:00:00 2001 From: peguerin <pierre-edouard.guerin@cefe.cnrs.fr> Date: Tue, 30 Oct 2018 14:06:27 +0100 Subject: [PATCH] adapters trimming --- 00-scripts/step1.sf | 8 ++++++-- 01-info_files/config.yaml | 10 +++++++--- main.sh | 3 +-- 3 files changed, 14 insertions(+), 7 deletions(-) diff --git a/00-scripts/step1.sf b/00-scripts/step1.sf index 580f2e4..43d27f8 100644 --- a/00-scripts/step1.sf +++ b/00-scripts/step1.sf @@ -19,14 +19,18 @@ rule process_radtags: enzyme=config["process_radtags"]["enzyme"], trim_length=config["process_radtags"]["trim_length"], score_limit=config["process_radtags"]["score_limit"], + windows_size=config["process_radtags"]["sliding_windows_size"], + adapter_mm=config["process_radtags"]["adapter_mm"], encoded=config["process_radtags"]["encoded"], - barcode_dist_1=config["process_radtags"]["barcode_dist_1"] + adapter_1=config["process_radtags"]["adapter_1"], + adapter_2=config["process_radtags"]["adapter_2"], + barcode_dist_1=config["process_radtags"]["barcode_dist_1"], barcode_dist_2=config["process_radtags"]["barcode_dist_2"] log: '10-logs/process_radtags/{runpool}.log' shell: '''mkdir -p {output}; - process_radtags -i gzfastq -P -p {input} -o {output} -b 01-info_files/barcodes.txt -c -r -t {params.trim_length} --barcode_dist_1 {params.barcode_dist_1} --barcode_dist_2 {params.barcode_dist_2} -s {params.score_limit} -E {params.encoded} -e {params.enzyme} 2> {log}''' + process_radtags -i gzfastq -P -p {input} -o {output} -b 01-info_files/barcodes.txt -c -r -t {params.trim_length} --adapter_mm {params.adapter_mm} --adapter_1 {params.adapter_1} --adapter_2 {params.adapter_2} --barcode_dist_1 {params.barcode_dist_1} --barcode_dist_2 {params.barcode_dist_2} -w {params.windows_size} -s {params.score_limit} -E {params.encoded} -e {params.enzyme} 2> {log}''' ### clone filter rule clone_filter: diff --git a/01-info_files/config.yaml b/01-info_files/config.yaml index 3cba3df..539d00a 100644 --- a/01-info_files/config.yaml +++ b/01-info_files/config.yaml @@ -1,10 +1,14 @@ process_radtags: enzyme : SbfI - trim_length : 143 + trim_length : 142 score_limit : 20 + sliding_windows_size : 0.20 encoded : phred33 - barcode_dist_1 : 2 - barcode_dist_2 : 2 + barcode_dist_1 : 1 + barcode_dist_2 : 1 + adapter_mm : 2 + adapter_1 : ACACTCTTTCCCTACACGACGCTCTTCCGATCT,AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGT,GATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCAGAACAA,CAAGCAGAAGACGGCATACGAGATCGGTCTCGGCATTCCTGCTGAACCGCTCTTCC + adapter_2 : ACACTCTTTCCCTACACGACGCTCTTCCGATCT,AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGT,GATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCAGAACAA,CAAGCAGAAGACGGCATACGAGATCGGTCTCGGCATTCCTGCTGAACCGCTCTTCC species: - mullus - serran diff --git a/main.sh b/main.sh index 4dd9cf2..24ec551 100644 --- a/main.sh +++ b/main.sh @@ -11,7 +11,6 @@ if [[ -z $check_already_indexed ]]; then snakemake -s 00-scripts/step2.sf -j $CORES fi ## assign (run, pool, barcode) to individual according to _infos.csv file and align them onto the genome -snakemake -s 00-scripts/step3.sf -j $CORES +snakemake -s 00-scripts/step3.sf -j $CORES -F ## run STACKS2 programs : gstacks & populations snakemake -s 00-scripts/step4.sf -j $CORES - -- GitLab