19
19
# basedir
20
20
# reference (hg19, dmd transcript)
21
21
22
- def makeSpliceTrapScripts (basedir , samples , reference , readsize , cutoff , outputFilePrefix ):
22
+ def makeSpliceTrapScripts (basedir , samples , reference , readsize , cutoff ):
23
23
24
24
#transcriptIndex = '/share/apps/richard/kallisto/kallisto_linux-v0.42.5/index/ensembl_GRCh37_transcripts_index'
25
25
transcriptIndex = reference
26
26
numThreads = 4
27
27
for samp in samples :
28
- # hack to decompress fastq.gz on the fly
28
+ # hack to decompress fastq.gz on the fly, does not work
29
29
#read1 = "<(gunzip -c " + os.path.join(basedir, samp, "00-raw", samp + "_1.fastq.gz") + ")"
30
30
#read2 = "<(gunzip -c " + os.path.join(basedir, samp, "00-raw", samp + "_2.fastq.gz") + ")"
31
+
32
+ # need to check if fastq is GZIPPED and uncompress first if so
31
33
read1 = os .path .join (basedir , samp , "00-raw" , samp + "_1.fastq" )
32
34
read2 = os .path .join (basedir , samp , "00-raw" , samp + "_2.fastq" )
35
+
36
+ if not os .path .isfile (read1 ):
37
+ read1gz = os .path .join (basedir , samp , "00-raw" , samp + "_1.fastq.gz" )
38
+ read2gz = os .path .join (basedir , samp , "00-raw" , samp + "_2.fastq.gz" )
39
+ cmdtxt = "gunzip -c " + read1gz + " > " + os .path .join (basedir , samp , "00-raw" , samp + "_1.fastq" ) + "\n "
40
+ cmdtxt += "gunzip -c " + read2gz + " > " + os .path .join (basedir , samp , "00-raw" , samp + "_2.fastq" ) + "\n "
41
+
33
42
outputdir = os .path .join (basedir , samp , "05-splicetrap" )
34
43
if not os .path .exists (outputdir ):
35
44
os .makedirs (outputdir )
45
+ outputFilePrefix = samp
36
46
37
47
nameOfJob = samp + "splicetrap"
38
48
sj = SpliceTrap (readsize ,
@@ -45,19 +55,21 @@ def makeSpliceTrapScripts(basedir, samples, reference, readsize, cutoff, outputF
45
55
nameOfJob ,
46
56
reference
47
57
)
48
- cmdtxt = sj .makeCommand ()
58
+ cmdtxt += sj .makeCommand ()
59
+
49
60
print cmdtxt
50
61
51
62
qsub = SGE (samp , "/home/rwang/rtwcode/rnaseq_tools/templates/qsub_tophat.tmpl" )
52
63
args = {'command' :cmdtxt , 'jobname' : str (samp )+ "splicetrap" , 'jobmem' :'20G' , 'logfilename' : "_" .join ([str (samp ), "splicetrap.log" ])}
53
64
outscript = os .path .join (basedir , samp , str (samp ) + "_splicetrap" + ".sh" )
54
65
print outscript
55
66
qsub .createJobScript (outscript , ** args )
67
+ cmdtxt = ""
56
68
57
69
# generate all tophat scripts:
58
70
59
71
#samples = [ "DDX7", "DDX8", "DDX9", "SH790"]
60
72
#basedir='/home/rwang/scratch1/rnaseq/human/Feb12/'
61
73
config = json .loads (open ("config_splicetrap.json" ).read ())
62
- makeSpliceTrapScripts (config ['basedir' ], config ['samples' ], config ['reference' ], config ['readsize' ], config ['cutoff' ], config [ 'outputFilePrefix' ] )
74
+ makeSpliceTrapScripts (config ['basedir' ], config ['samples' ], config ['reference' ], config ['readsize' ], config ['cutoff' ] )
63
75
0 commit comments