2022-09-09 20:30:21,026 INFO Cutadapt Mode: Paired-end 2022-09-09 20:30:21,027 INFO Cutadapt Input FASTQ [R1]: /dreamworld/ngs_data/20220816_Novogene_data/X201SC22041027-Z01-F003/01.RawData/N41/N41_FKDL220180557-1A_HJCT5DSX3_L1_1.fq.gz 2022-09-09 20:30:21,027 INFO Cutadapt Input FASTQ [R2]: /dreamworld/ngs_data/20220816_Novogene_data/X201SC22041027-Z01-F003/01.RawData/N41/N41_FKDL220180557-1A_HJCT5DSX3_L1_2.fq.gz 2022-09-09 20:30:21,027 INFO Cutadapt Output FASTQ [R1]: /tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz 2022-09-09 20:30:21,027 INFO Cutadapt Output FASTQ [R2]: /tmp/tmpav0qc6wj/adapter_R2_0.fastq.gz 2022-09-09 20:30:21,027 INFO Cutadapt Adapter: illumina 2022-09-09 20:30:21,027 DEBUG SimpleSubprocess cutadapt -j 10 -e 0.2 -m 8 -a AGATCGGAAGAGCACACGTCTGAACTCCAGTCA -A AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGT -o "/tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz" -p "/tmp/tmpav0qc6wj/adapter_R2_0.fastq.gz" "/dreamworld/ngs_data/20220816_Novogene_data/X201SC22041027-Z01-F003/01.RawData/N41/N41_FKDL220180557-1A_HJCT5DSX3_L1_1.fq.gz" "/dreamworld/ngs_data/20220816_Novogene_data/X201SC22041027-Z01-F003/01.RawData/N41/N41_FKDL220180557-1A_HJCT5DSX3_L1_2.fq.gz" > "/dreamworld/ngs_data/NIPT/N41/N41.InputItem0.cutadapt.txt" 2022-09-09 20:30:26,633 INFO SimpleSubprocess Cutadapt.Trim - 0:00:05 2022-09-09 20:30:26,634 INFO FastQC FastQ: /tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz 2022-09-09 20:30:26,634 INFO FastQC Report: /dreamworld/ngs_data/NIPT/N41/N41.InputItem0.fastqc.html 2022-09-09 20:30:26,650 INFO FastQC Subsample: 1000000 2022-09-09 20:30:26,650 DEBUG SimpleSubprocess zcat -q "/tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz" | head -4000000 | gzip -c > "/tmp/tmpib2eky_3/sample.fastq.gz" 2022-09-09 20:30:33,908 INFO SimpleSubprocess FastQC.Sampling - 0:00:07 2022-09-09 20:30:33,908 DEBUG SimpleSubprocess fastqc -o "/tmp/tmpib2eky_3" -t 10 "/tmp/tmpib2eky_3/sample.fastq.gz" 2022-09-09 20:30:38,110 INFO SimpleSubprocess FastQC.Analysis - 0:00:04 2022-09-09 20:30:38,111 DEBUG SimpleSubprocess cp "/tmp/tmpib2eky_3/sample_fastqc.html" "/dreamworld/ngs_data/NIPT/N41/N41.InputItem0.fastqc.html" 2022-09-09 20:30:38,114 INFO SimpleSubprocess FastQC.Move - 0:00:00 2022-09-09 20:30:38,118 INFO BWA R1: /tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz 2022-09-09 20:30:38,118 INFO BWA R2: /tmp/tmpav0qc6wj/adapter_R2_0.fastq.gz 2022-09-09 20:30:38,118 INFO BWA Output BAM: /tmp/tmpav0qc6wj/temp_0.bam 2022-09-09 20:30:38,118 INFO BWA Reference: /dreamworld/databases/hg19_canonical/hg19_canonical.fa 2022-09-09 20:30:38,118 INFO BWA RG Header: @RG\tID:FCHJCT5DSX3.L1\tPL:ILLUMINA\tPU:FCHJCT5DSX3.L1.GGCTACAT\tLB:LIB-N41-002\tSM:N41 2022-09-09 20:30:38,140 DEBUG SimpleSubprocess source /dreamworld/miniconda3/bin/activate gatk; set -o pipefail; bwa mem -R "@RG\tID:FCHJCT5DSX3.L1\tPL:ILLUMINA\tPU:FCHJCT5DSX3.L1.GGCTACAT\tLB:LIB-N41-002\tSM:N41" -t 10 -v 1 "/dreamworld/databases/hg19_canonical/hg19_canonical.fa" "/tmp/tmpav0qc6wj/adapter_R1_0.fastq.gz" "/tmp/tmpav0qc6wj/adapter_R2_0.fastq.gz" | gatk SortSam --VERBOSITY ERROR --TMP_DIR "/tmp/tmpuqvh0zo8" -SO queryname -I "/dev/stdin" -O "/tmp/tmpav0qc6wj/temp_0.bam" 2022-09-09 20:31:19,304 INFO SimpleSubprocess BWA.AlignAndSort - 0:00:41 2022-09-09 20:31:19,304 DEBUG SimpleSubprocess cp "/tmp/tmpav0qc6wj/temp_0.bam" "/dreamworld/ngs_data/NIPT/N41/IRs/N41.primary.bam" 2022-09-09 20:31:19,350 INFO SimpleSubprocess DaemonicPipe.CopyBAM - 0:00:00 2022-09-09 20:31:19,351 DEBUG SimpleSubprocess samtools flagstat -O tsv "/dreamworld/ngs_data/NIPT/N41/IRs/N41.primary.bam" > "/dreamworld/ngs_data/NIPT/N41/N41.primary_stats.txt" 2022-09-09 20:31:19,910 INFO SimpleSubprocess DaemonicPipe.FlagStats - 0:00:00 2022-09-09 20:31:19,928 INFO MarkDuplicates Input: /dreamworld/ngs_data/NIPT/N41/IRs/N41.primary.bam 2022-09-09 20:31:19,929 INFO MarkDuplicates Output: /dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam 2022-09-09 20:31:19,929 INFO MarkDuplicates Metrics: /dreamworld/ngs_data/NIPT/N41/N41.md_metrics.txt 2022-09-09 20:31:19,929 DEBUG SimpleSubprocess source /dreamworld/miniconda3/bin/activate gatk; set -o pipefail; gatk --java-options "-XX:+UseParallelGC -XX:ParallelGCThreads=2" MarkDuplicates --REMOVE_DUPLICATES true --VERBOSITY ERROR --ASSUME_SORT_ORDER queryname --TMP_DIR "/tmp/tmp3e2z2i_r" -M "/dreamworld/ngs_data/NIPT/N41/N41.md_metrics.txt" -I "/dreamworld/ngs_data/NIPT/N41/IRs/N41.primary.bam" -O "/dev/stdout" | gatk SortSam --VERBOSITY ERROR --TMP_DIR "/tmp/tmp3e2z2i_r" -SO coordinate -I "/dev/stdin" -O "/dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam" 2022-09-09 20:31:34,065 INFO SimpleSubprocess MarkDuplicates.RemoveAndSort - 0:00:14 2022-09-09 20:31:34,065 DEBUG SimpleSubprocess source /dreamworld/miniconda3/bin/activate gatk; gatk BuildBamIndex -I "/dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam" 2022-09-09 20:31:39,619 INFO SimpleSubprocess MarkDuplicates.Index - 0:00:05 2022-09-09 20:31:39,619 INFO CoverageStats BAM File: /dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam 2022-09-09 20:31:39,619 INFO CoverageStats Reference: /dreamworld/databases/hg19_canonical/hg19_canonical.fa 2022-09-09 20:31:39,619 INFO CoverageStats Capture BED: /dreamworld/databases/hg19_canonical/capture/KAPA_HyperExome/KAPA_HyperExome.capture.bed 2022-09-09 20:31:39,620 DEBUG SimpleSubprocess awk 'BEGIN {FS="\t"}; {print $1 FS "0" FS $2}' "/dreamworld/databases/hg19_canonical/hg19_canonical.fa.fai" > "/tmp/tmp48bka_96/genome.bed" 2022-09-09 20:31:39,622 INFO SimpleSubprocess PrepareGenomeBED.Create - 0:00:00 2022-09-09 20:31:39,623 DEBUG SimpleSubprocess bedtools subtract -a "/tmp/tmp48bka_96/genome.bed" -b "/dreamworld/databases/hg19_canonical/capture/KAPA_HyperExome/KAPA_HyperExome.capture.bed" | sed -e 's/$/\t\./' > "/tmp/tmp48bka_96/not_capture.bed" 2022-09-09 20:31:42,030 INFO SimpleSubprocess CoverageStats.CreateNotCaptureBed - 0:00:02 2022-09-09 20:31:42,030 DEBUG SimpleSubprocess bedtools coverage -hist -sorted -g "/dreamworld/databases/hg19_canonical/hg19_canonical.fa.fai" -a "/dreamworld/databases/hg19_canonical/capture/KAPA_HyperExome/KAPA_HyperExome.capture.bed" -b "/dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam" | grep -P "^all.*$" > "/tmp/tmp48bka_96/capture.csv" 2022-09-09 20:31:43,940 INFO SimpleSubprocess CoverageStats.CaptureCoverage - 0:00:01 2022-09-09 20:31:43,940 DEBUG SimpleSubprocess bedtools coverage -hist -sorted -g "/dreamworld/databases/hg19_canonical/hg19_canonical.fa.fai" -a "/tmp/tmp48bka_96/not_capture.bed" -b "/dreamworld/ngs_data/NIPT/N41/IRs/N41.dupless.bam" | grep -P "^all.*$" > "/tmp/tmp48bka_96/not_capture.csv" 2022-09-09 20:32:04,342 INFO SimpleSubprocess CoverageStats.NotCaptureCoverage - 0:00:20