From 97fd01f393c2354f4dc52f0700a951399b92a8fc Mon Sep 17 00:00:00 2001
From: Peter van 't Hof <p.j.van_t_hof@lumc.nl>
Date: Tue, 3 Jun 2014 11:42:56 +0200
Subject: [PATCH] Changed to make it compatible for new file structure

---
 .../flexiprep/scripts/summarize_flexiprep.py       | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/flexiprep/scripts/nl/lumc/sasc/biopet/pipelines/flexiprep/scripts/summarize_flexiprep.py b/flexiprep/scripts/nl/lumc/sasc/biopet/pipelines/flexiprep/scripts/summarize_flexiprep.py
index ce0723be8..cdf952472 100755
--- a/flexiprep/scripts/nl/lumc/sasc/biopet/pipelines/flexiprep/scripts/summarize_flexiprep.py
+++ b/flexiprep/scripts/nl/lumc/sasc/biopet/pipelines/flexiprep/scripts/summarize_flexiprep.py
@@ -116,7 +116,7 @@ def clip2dict(sample, samplea, sampleb, lib_type, run_dir):
 
     def get_sync_stats(sample):
         stats = {}
-        with open_result(sample + '.clipsync.stats') as src:
+        with open_result(sample + '.clip.sync.stats') as src:
             sync_txt = src.read()
 
         stats['num_reads_discarded_1'] = int(re.search(re_disc_1, sync_txt).group(1))
@@ -146,15 +146,19 @@ def clip2dict(sample, samplea, sampleb, lib_type, run_dir):
     return clip_stats
 
 
-def sickle2dict(run_name, lib_type, run_dir):
+def sickle2dict(run_name, qc_mode, lib_type, run_dir):
 
     trim_stats = {}
+    if qc_mode == 'trim':
+        stat_mark = '.trim.stats'
+    else:
+        stat_mark = '.clip.sync.trim.stats'
 
     if lib_type == 'paired':
         re_paired_kept = re.compile(r'paired records kept: \d+ \((\d+) pairs\)')
         re_disc = re.compile(r'single records discarded: \d+ \(from PE1: (\d+), from PE2: (\d+)\)')
         re_disc_paired = re.compile(r'paired records discarded: \d+ \((\d+) pairs\)')
-        with open(os.path.join(run_dir, run_name + '.filtersync.stats')) as src:
+        with open(os.path.join(run_dir, run_name + stat_mark)) as src:
             sickle_txt = src.read()
 
         discarda = int(re.search(re_disc, sickle_txt).group(1))
@@ -170,7 +174,7 @@ def sickle2dict(run_name, lib_type, run_dir):
     else:
         re_kept = re.compile(r'records kept: (\d+)')
         re_disc = re.compile(r'records discarded: (\d+)')
-        with open(os.path.join(run_dir, run_name + '.filtersync.stats')) as src:
+        with open(os.path.join(run_dir, run_name + stat_mark)) as src:
             sickle_txt = src.read()
 
         trim_stats['num_reads_kept'] = int(re.search(re_kept, sickle_txt).group(1))
@@ -399,7 +403,7 @@ def summarize_flexiprep(run_name, qc_mode, samplea, sampleb, outf, run_dir):
         sumd['stats']['clip'] = clip2dict(run_name, samplea, sampleb, lib_type, run_dir)
 
     if 'trim' in qc_mode:
-        sumd['stats']['trim'] = sickle2dict(run_name, lib_type, run_dir)
+        sumd['stats']['trim'] = sickle2dict(run_name, qc_mode, lib_type, run_dir)
 
     dict2json(sumd, outf)
 
-- 
GitLab