From 8793fa4ac786a2542eb49ff02c5e86b99a3fd8e3 Mon Sep 17 00:00:00 2001
From: mariabernard <maria.bernard@jouy.inra.fr>
Date: Fri, 7 Jun 2019 09:17:09 +0200
Subject: [PATCH] 1000RNASeq_chicken ASE : perform rmdup for single end read

---
 Snakemake/1000RNASeq_chicken/ASE/Snakefile       |  4 ++--
 .../1000RNASeq_chicken/ASE/rules/ASE_counter.smk |  2 +-
 Snakemake/1000RNASeq_chicken/ASE/rules/STAR.smk  | 16 ++++++++--------
 3 files changed, 11 insertions(+), 11 deletions(-)

diff --git a/Snakemake/1000RNASeq_chicken/ASE/Snakefile b/Snakemake/1000RNASeq_chicken/ASE/Snakefile
index 78851bb..b10780e 100644
--- a/Snakemake/1000RNASeq_chicken/ASE/Snakefile
+++ b/Snakemake/1000RNASeq_chicken/ASE/Snakefile
@@ -130,7 +130,7 @@ for sample in table["sample_name"].unique():
 	    final_outputs.append("Results/STAR_Aln_2/" + sample + "_rg_genomic_pp_rmdup_uniq_split.bam")
 	# single end, no filter on properly paired
 	elif len(sample_table["reverse_read"].dropna() ) == 0:
-	    final_outputs.append("Results/STAR_Aln_2/" + sample + "_rg_genomic_uniq_split.bam")
+	    final_outputs.append("Results/STAR_Aln_2/" + sample + "_rg_genomic_rmdup_uniq_split.bam")
 
 # # counter
 for sample in table["sample_name"].unique():
@@ -146,4 +146,4 @@ for sample in table["sample_name"].unique():
 
 rule all:
     input:
-        final_outputs
\ No newline at end of file
+        final_outputs
diff --git a/Snakemake/1000RNASeq_chicken/ASE/rules/ASE_counter.smk b/Snakemake/1000RNASeq_chicken/ASE/rules/ASE_counter.smk
index d91340a..b239bb5 100644
--- a/Snakemake/1000RNASeq_chicken/ASE/rules/ASE_counter.smk
+++ b/Snakemake/1000RNASeq_chicken/ASE/rules/ASE_counter.smk
@@ -18,7 +18,7 @@ def get_splitNCigar_bam(wildcards):
         return "Results/STAR_Aln_2/" + wildcards.sample + "_rg_genomic_pp_rmdup_uniq_split.bam"
     # single end, no filter
     elif len(sample_table["reverse_read"].dropna() ) == 0:
-        return "Results/STAR_Aln_2/" + wildcards.sample + "_rg_genomic_uniq_split.bam"
+        return "Results/STAR_Aln_2/" + wildcards.sample + "_rg_genomic_rmdup_uniq_split.bam"
     else :
     	raise Exception(wildcards.sample + " is sequenced in pair end & single end mode\n 	This workflow do not accept this case!\n")
 
diff --git a/Snakemake/1000RNASeq_chicken/ASE/rules/STAR.smk b/Snakemake/1000RNASeq_chicken/ASE/rules/STAR.smk
index cc55d4b..8df1b00 100644
--- a/Snakemake/1000RNASeq_chicken/ASE/rules/STAR.smk
+++ b/Snakemake/1000RNASeq_chicken/ASE/rules/STAR.smk
@@ -8,7 +8,7 @@ Align RNASeq reads on masked genome
 '''
 
 wildcard_constraints:
-    properlyPaired_rmDup = '_pp_rmdup_|_'
+    properlyPaired_rmDup = '_pp_|_'
 
 STAR_INDEX_FILE=['genomeParameters.txt', 'chrName.txt', 'chrLength.txt', 'chrStart.txt', 'chrNameLength.txt', 'exonGeTrInfo.tab', 'geneInfo.tab', 'transcriptInfo.tab', 'exonInfo.tab', 'sjdbList.fromGTF.out.tab', 'sjdbInfo.txt', 'sjdbList.out.tab', 'Genome', 'SA', 'SAindex']
 
@@ -161,8 +161,8 @@ rule rmdup:
     input:
         bam = get_properly_paired_bam
     output:
-        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}.bam",
-        metrics = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}.metrics.txt",
+        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired}.bam",
+        metrics = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired}.metrics.txt",
     params:
         mem=str(int(config["rmdup"]["mem"].replace("G","")) -4 )+"G" if int(config["rmdup"]["mem"].replace("G","")) -4 > 1 else config["rmdup"]["mem"] ,
         jar=find_jar("picard.jar")
@@ -173,9 +173,9 @@ rule rmdup:
 
 rule remove_multimap:
     input:
-        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}.bam"
+        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired}rmdup.bam"
     output:
-        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}uniq.bam"
+        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired}rmdup_uniq.bam"
     shell:
         """
         samtools view -h -q 255 {input.bam} -bo {output.bam} 
@@ -184,9 +184,9 @@ rule remove_multimap:
 rule SplitNCigarReads:
     input:
         fasta = 'Results/genomeMasked/' + os.path.splitext(os.path.basename(config['fasta_ref']))[0] + '_masked.fa', 
-        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}uniq.bam"
+        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired}rmdup_uniq.bam"
     output:
-        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPaired_rmDup}uniq_split.bam"
+        bam = "Results/STAR_Aln_2/{sample}_rg_genomic{properlyPairedrmdup_uniq_split.bam"
     params:
         mem=config["SplitNCigarReads"]["mem"],
         jar=find_jar("GenomeAnalysisTK.jar")
@@ -194,4 +194,4 @@ rule SplitNCigarReads:
         """
         java -Xmx{params.mem} -jar {params.jar} -T SplitNCigarReads -R {input.fasta} -I {input.bam} -o {output.bam} -rf ReassignOneMappingQuality -RMQF 255 -RMQT 60 -U ALLOW_N_CIGAR_READS 
         """
-    
\ No newline at end of file
+    
-- 
GitLab