Since counting lines can take a long time, take advantage of the fact that a fastq record is always 4 lines.
GNU Parallel can read records of 4 lines with -L 4.
Each job then receives whole fastq records, i.e. n * 4 lines.
It would be faster to use --pipe-part, but --pipe-part does not support -L, so we use --pipe.
zcat file1.fastq.gz | parallel -j16 --pipe -L 4 --joblog split_log.txt --resume-failed "gzip > ${input_file}_child_{#}.gz"
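By default this passes blocks of about 1 MB, each cut at a record boundary (i.e. at a multiple of 4 lines). A new process is started for every block. If you instead want the n * 4 lines distributed over 16 processes in total, and no more, use --round-robin, but then --resume-failed makes no sense: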
zcat file1.fastq.gz | parallel -j16 --pipe -L 4 --joblog split_log.txt --round-robin "gzip > ${input_file}_child_{#}.gz"
parallel will struggle to keep 16 gzips busy, but you should still be able to compress 100-200 MB/s.
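Now, if the fastq file were uncompressed, we could do it even faster, but we have to cheat a bit: in fastq files the seqname lines often all start with the same string: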
@EAS54_6_R1_2_1_413_324
CCCTTCTTGTCTTCAGCGTTTCTCC
+
;;3;;;;;;;;;;;;7;;;;;;;88
@EAS54_6_R1_2_1_540_792
TTGGCAGGCCAAGGCCGATGGATCA
+
;;;;;;;;;;;7;;;;;-;;;3;83
@EAS54_6_R1_2_1_443_348
GTTGCTTCTGGCGTGGGTGGGGGGG
+EAS54_6_R1_2_1_443_348
;;;;;;;;;;;9;7;;.7;393333
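Here it is @EAS54_6_R. Unfortunately this is also a valid string in a quality line (which is a really poor design), but in practice it would be extremely surprising to see a quality line starting with @EAS54_6_R. It just does not happen.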
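We can use that to our advantage: with \n followed by @EAS54_6_R as the record separator, we can use --pipe-part. An added benefit is that the order of the records stays the same. Here you have to set the block size to 1/16 of the size of file1.fastq: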
parallel -a file1.fastq --block <<1/16th of the size of file1.fastq>> -j16 --pipe-part --recend '\n' --recstart '@EAS54_6_R' --joblog split_log.txt "gzip > ${input_file}_child_{#}.gz"
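If you use GNU Parallel 20161222 or later, GNU Parallel can do that computation for you. --block -1 means: choose a block size such that each of the 16 jobslots gets exactly one block.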
parallel -a file1.fastq --block -1 -j16 --pipe-part --recend '\n' --recstart '@EAS54_6_R' --joblog split_log.txt "gzip > ${input_file}_child_{#}.gz"
Here GNU Parallel will not be the limiting factor: it can easily transfer 20 GB/s.
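Having to open the file to find out what the --recstart value should be is annoying, so the following regular expression will work in most cases: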
parallel -a file1.fastq --pipe-part --block -1 -j16 \
  --regexp --recend '\n' --recstart '@.*\n[A-Za-z\n\.~]' \
  my_command
Here we assume that every record looks like this:
@<anything>
[A-Za-z\n\.~]<anything>
<anything>
<anything>
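Even if a few quality lines start with "@", they will never be followed by a line starting with [A-Za-z\n\.~], because a quality line is always followed by a seqname line, which starts with @.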
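You could also choose a block size so large that it corresponds to 1/16 of the uncompressed file, but that would be a bad idea: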
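By setting the number of records to 104214420 (using -N), this is essentially what you are doing, and your server is probably struggling to keep the 150 GB of uncompressed data in its 36 GB of RAM.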