testTask=pipeline.collate(task_func=dummyFunc,
name='testTask',
input=output_from('getFiles'),
filter=formatter(raw_00+r"/seq_R[12](?P<FILENR>_[0-9]{4}).fastq.gz"),
output=[trim_05+'/seq_R1{FILENR[0]}_val_1.fq.gz', trim_05+'/seq_R2{FILENR[0]}_val_2.fq.gz'],
extras=[cmd]).mkdir(trim_05)
cmd="echo {inputfile}"
cmd="echo {inputfile[0]}"
testTask=pipeline.collate(task_func=dummyFunc,
name='testTask',
input=output_from('getFiles'),
filter=regex(r".*/seq_R[12](_[0-9]{4}).fastq.gz"),
output=[trim_05+r'/seq_R1\1_val_1.fq.gz', trim_05+r'/seq_R2\1_val_2.fq.gz'],
extras=[cmd]).mkdir(trim_05)
--
You received this message because you are subscribed to the Google Groups "ruffus_discuss" group.
To unsubscribe from this group and stop receiving emails from it, send an email to ruffus_discus...@googlegroups.com.
For more options, visit https://groups.google.com/d/optout.
from ruffus import *
def dummyFunc(inputFile,outputFile,cmd):
for file in outputFile:
with open(file, 'w') as oo: pass
return outputFile
def genFile(outputFile):
open(outputFile,'w')
return outputFile
tmpDir='/tmp/test150907'
raw_00=tmpDir+'/raw'
trim_05=tmpDir+'/trim1'
trim_10=tmpDir+'/trim2'
files= ['seq_R1_0001.fastq.gz', 'seq_R1_0002.fastq.gz', 'seq_R1_0003.fastq.gz', 'seq_R1_0004.fastq.gz', 'seq_R1_0005.fastq.gz', 'seq_R1_0006.fastq.gz', 'seq_R1_0007.fastq.gz', 'seq_R1_0008.fastq.gz', 'seq_R1_0009.fastq.gz', 'seq_R1_0010.fastq.gz', 'seq_R1_0011.fastq.gz', 'seq_R1_0012.fastq.gz', 'seq_R1_0013.fastq.gz', 'seq_R1_0014.fastq.gz', 'seq_R1_0015.fastq.gz', 'seq_R1_0016.fastq.gz', 'seq_R1_0017.fastq.gz', 'seq_R1_0018.fastq.gz', 'seq_R1_0019.fastq.gz', 'seq_R1_0020.fastq.gz', 'seq_R1_0021.fastq.gz', 'seq_R1_0022.fastq.gz', 'seq_R1_0023.fastq.gz', 'seq_R1_0024.fastq.gz', 'seq_R1_0025.fastq.gz', 'seq_R1_0026.fastq.gz', 'seq_R1_0027.fastq.gz', 'seq_R1_0028.fastq.gz', 'seq_R1_0029.fastq.gz', 'seq_R1_0030.fastq.gz', 'seq_R1_0031.fastq.gz', 'seq_R1_0032.fastq.gz', 'seq_R2_0001.fastq.gz', 'seq_R2_0002.fastq.gz', 'seq_R2_0003.fastq.gz', 'seq_R2_0004.fastq.gz', 'seq_R2_0005.fastq.gz', 'seq_R2_0006.fastq.gz', 'seq_R2_0007.fastq.gz', 'seq_R2_0008.fastq.gz', 'seq_R2_0009.fastq.gz', 'seq_R2_0010.fastq.gz', 'seq_R2_0011.fastq.gz', 'seq_R2_0012.fastq.gz', 'seq_R2_0013.fastq.gz', 'seq_R2_0014.fastq.gz', 'seq_R2_0015.fastq.gz', 'seq_R2_0016.fastq.gz', 'seq_R2_0017.fastq.gz', 'seq_R2_0018.fastq.gz', 'seq_R2_0019.fastq.gz', 'seq_R2_0020.fastq.gz', 'seq_R2_0021.fastq.gz', 'seq_R2_0022.fastq.gz', 'seq_R2_0023.fastq.gz', 'seq_R2_0024.fastq.gz', 'seq_R2_0025.fastq.gz', 'seq_R2_0026.fastq.gz', 'seq_R2_0027.fastq.gz', 'seq_R2_0028.fastq.gz', 'seq_R2_0029.fastq.gz', 'seq_R2_0030.fastq.gz', 'seq_R2_0031.fastq.gz', 'seq_R2_0032.fastq.gz']
files= [raw_00+'/'+file for file in files]
pipeline=Pipeline('test150907')
genFiles=pipeline.originate(task_func=genFile,
name='genFiles',
output=files).mkdir(raw_00)
cmd="echo {inputfile}"
testTask=pipeline.collate(task_func=dummyFunc,
name='testTask1',
input=output_from('genFiles'),
filter=formatter(raw_00+r"/seq_R[12](?P<FILENR>_[0-9]{4}).fastq.gz"),
output=[trim_05+'/seq_R1{FILENR[0]}_val_1.fq.gz', trim_05+'/seq_R2{FILENR[0]}_val_2.fq.gz'],
extras=[cmd]).mkdir(trim_05)
cmd="echo {inputfile[0]}"
testTask=pipeline.collate(task_func=dummyFunc,
name='testTask2',
input=output_from('genFiles'),
filter=formatter(raw_00+r"/seq_R[12](?P<FILENR>_[0-9]{4}).fastq.gz"),
output=[trim_10+'/seq_R1{FILENR[0]}_val_1.fq.gz', trim_10+'/seq_R2{FILENR[0]}_val_2.fq.gz'],
extras=[cmd]).mkdir(trim_10)
pipeline.run()
WARNING:
'In Task 'test150907.testTask2':' No jobs were run because no files names matched. Please make sure that the regular expression is correctly specified.