From 95f70fe7a1ba9eacb086560f075d8db2a561a0ee Mon Sep 17 00:00:00 2001
From: Valentina Galata <valentina.galata@uni.lu>
Date: Thu, 2 Jul 2020 12:58:39 +0200
Subject: [PATCH] workflow: rm partial gene counts rule from analysis (issue
 #50)

---
 workflow/rules/analysis.smk | 26 --------------------------
 workflow/steps/analysis.smk |  4 ----
 2 files changed, 30 deletions(-)

diff --git a/workflow/rules/analysis.smk b/workflow/rules/analysis.smk
index 07b63ec..b457cd9 100644
--- a/workflow/rules/analysis.smk
+++ b/workflow/rules/analysis.smk
@@ -26,23 +26,6 @@ rule analysis_quast:
 ##################################################
 # Proteins
 
-# Number of partial genes
-rule analysis_prodigal_partial:
-    input:
-        os.path.join(RESULTS_DIR, "annotation/prodigal/{rtype}/{tool}/proteins.faa")
-    output:
-        os.path.join(RESULTS_DIR, "annotation/prodigal/{rtype}/{tool}/partial_gene_counts.txt")
-    wildcard_constraints:
-        rtype="|".join(READ_TYPES),
-        tool="|".join(ASSEMBLERS)
-    threads: 1
-    message:
-        "Count partial genes in {input}"
-    shell:
-        "grep -E -o 'partial.{{0,3}}' {input} | grep '10\|01\|11' | wc -l > {output}"
-
-# TODO: summary for tables/figures: separate *.smk
-
 # for CD-HIT
 rule analysis_bbmap_rename:
     input:
@@ -93,15 +76,6 @@ rule analysis_cdhit:
         "cd-hit-2d -i {input.faa2} -i2 {input.faa1} -o {output.faa21} -c 0.9 -n 5 -d 0 -M 16000 -T 8 && "
         "date) 2> {log.err} > {log.out}"
 
-# TODO: summary for tables/figures: separate *.smk
-# """
-# cd-hit-2d -i {input.co1} -i2 {input.co2} -o {output.form1} -c 0.9 -n 5 -d 0 -M 16000 -T 8 &&\
-# cd-hit-2d -i {input.co2} -i2 {input.co1} -o {output.form2} -c 0.9 -n 5 -d 0 -M 16000 -T 8 &&\
-# echo {output.form1} > tmp && grep -c '>' {output.form1} >> tmp &&\
-# echo {output.form2} >> tmp && grep -c '>' {output.form2} >> tmp &&\
-# cat tmp | paste - - > {output.form3}
-# """
-
 ##################################################
 # MMseqs2
 
diff --git a/workflow/steps/analysis.smk b/workflow/steps/analysis.smk
index 144d642..b72948c 100644
--- a/workflow/steps/analysis.smk
+++ b/workflow/steps/analysis.smk
@@ -24,10 +24,6 @@ rule ANALYSIS_ASSEMBLY:
 
 rule ANALYSIS_PROTEINS:
     input:
-        expand(
-            os.path.join(RESULTS_DIR, "annotation/prodigal/{rtype_tool}/partial_gene_counts.txt"),
-            rtype_tool=["%s/%s" % (rtype, tool) for rtype, tool in READ_ASSEMBLERS]
-        ),
         expand(
             os.path.join(RESULTS_DIR, "analysis/cdhit/{combi}.faa"),
             combi=["%s_%s__%s_%s" % (p[0][0], p[0][1], p[1][0], p[1][1]) for p in READ_ASSEMBLER_PAIRS]
-- 
GitLab