/home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/PortablePipeline/PortablePipeline/scripts/pp 'post-assemble~coverage-length-graph_by-minimap2' -c 16 -m 32 -x true input_1/scaffolds.fasta input_2 Checking the realpath of input files. 1 script: /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/PortablePipeline/PortablePipeline/scripts/post-assemble~coverage-length-graph_by-minimap2 Containers: c2997108/centos6:2-bwa-0.7.17-r1198-dirty c2997108/ubuntu20:R-2_gplots centos:centos6 quay.io/biocontainers/minimap2:2.28--h577a1d6_4 quay.io/biocontainers/samtools:1.19--h50ea8bc_0 quay.io/biocontainers/seqkit:0.12.1--0 using docker ++ set -o pipefail + set -eux + set -o pipefail + ref=input_1/scaffolds.fasta + '[' '!' -e input_1/scaffolds.fasta.fai ']' + xargs '-d\n' -I '{}' -P 1 bash -c '{}' ++ find input_2/ -maxdepth 1 ++ egrep '[.]f(ast|)q(|[.]gz)$' + for i in `find $input_2/ -maxdepth 1 |egrep '[.]f(ast|)q(|[.]gz)$' || true` ++ basename input_2/test_1.fq + i2=test_1.fq ++ basename input_2/test_1.fq ++ sed 's/[.]f\(ast\|\)q.*//' + samplename=test_1 + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/minimap2:2.28--h577a1d6_4 minimap2 -t 16 -ax map-ont '\''input_1/scaffolds.fasta'\'' '\''input_2/test_1.fq'\'' | ( PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools view -h -F 0x900 ) > '\''test_1.fq.sam'\''' + for i in `find $input_2/ -maxdepth 1 |egrep '[.]f(ast|)q(|[.]gz)$' || true` ++ basename input_2/test_2.fq + i2=test_2.fq ++ basename input_2/test_2.fq ++ sed 's/[.]f\(ast\|\)q.*//' + samplename=test_2 + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/minimap2:2.28--h577a1d6_4 minimap2 -t 16 -ax map-ont '\''input_1/scaffolds.fasta'\'' '\''input_2/test_2.fq'\'' | ( PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools view -h -F 0x900 ) > '\''test_2.fq.sam'\''' [M::mm_idx_gen::0.217*1.10] collected minimizers [M::mm_idx_gen::0.303*1.53] sorted minimizers [M::main::0.303*1.52] loaded/built the index for 2111 target sequence(s) [M::mm_mapopt_update::0.323*1.49] mid_occ = 19 [M::mm_idx_stat] kmer size: 15; skip: 10; is_hpc: 0; #seq: 2111 [M::mm_idx_stat::0.338*1.47] distinct minimizers: 955730 (97.96% are singletons); average occurrences: 1.039; average spacing: 5.390; total length: 5354294 [M::worker_pipeline::0.487*2.70] mapped 10000 sequences [M::main] Version: 2.28-r1209 [M::main] CMD: minimap2 -t 16 -ax map-ont input_1/scaffolds.fasta input_2/test_1.fq [M::main] Real time: 0.504 sec; CPU: 1.333 sec; Peak RSS: 0.075 GB [M::mm_idx_gen::0.282*1.07] collected minimizers [M::mm_idx_gen::0.329*1.89] sorted minimizers [M::main::0.329*1.89] loaded/built the index for 2111 target sequence(s) [M::mm_mapopt_update::0.351*1.83] mid_occ = 19 [M::mm_idx_stat] kmer size: 15; skip: 10; is_hpc: 0; #seq: 2111 [M::mm_idx_stat::0.370*1.79] distinct minimizers: 955730 (97.96% are singletons); average occurrences: 1.039; average spacing: 5.390; total length: 5354294 [M::worker_pipeline::0.515*2.90] mapped 10000 sequences [M::main] Version: 2.28-r1209 [M::main] CMD: minimap2 -t 16 -ax map-ont input_1/scaffolds.fasta input_2/test_2.fq [M::main] Real time: 0.529 sec; CPU: 1.508 sec; Peak RSS: 0.067 GB + cat + for i in *.sam + xargs '-d\n' -I '{}' -P 16 bash -c '{}' + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm c2997108/ubuntu20:R-2_gplots bash run-cleanup.sh "test_1.fq.sam" "0.3" "0" "input_1/scaffolds.fasta"' + for i in *.sam + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm c2997108/ubuntu20:R-2_gplots bash run-cleanup.sh "test_2.fq.sam" "0.3" "0" "input_1/scaffolds.fasta"' R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. > library(Cairo); a=read.table("test_1.fq.sam2.cov",sep="\t",row.names=1); > CairoPNG(file="test_1.fq.sam2.cov.png",width=1000,height=1000); sunflowerplot(x=a[,1], y=a[,3], xlab="coverage [fold]", ylab="contig length [bp]", log="xy"); dev.off() > library(Cairo); a=read.table("test_2.fq.sam2.cov",sep="\t",row.names=1); > CairoPNG(file="test_2.fq.sam2.cov.png",width=1000,height=1000); sunflowerplot(x=a[,1], y=a[,3], xlab="coverage [fold]", ylab="contig length [bp]", log="xy"); dev.off() Error in rep.int(i.multi, number[number > 1]) : invalid 'times' value Calls: sunflowerplot -> sunflowerplot.default Execution halted Error in rep.int(i.multi, number[number > 1]) : invalid 'times' value Calls: sunflowerplot -> sunflowerplot.default Execution halted R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. > library(Cairo); data=read.table("test_1.fq.sam2.cov.hist",sep="\t", header = FALSE);colnames(data) <- c("Coverage", "Frequency"); CairoPNG(file="test_1.fq.sam2.cov.hist.png",width=1000,height=1000); plot(data$Coverage, data$Frequency, type = "o", col = "blue", main = "Coverage Histogram", xlab = "Depth", ylab = "Total bases of contigs"); dev.off() > library(Cairo); data=read.table("test_2.fq.sam2.cov.hist",sep="\t", header = FALSE);colnames(data) <- c("Coverage", "Frequency"); CairoPNG(file="test_2.fq.sam2.cov.hist.png",width=1000,height=1000); plot(data$Coverage, data$Frequency, type = "o", col = "blue", main = "Coverage Histogram", xlab = "Depth", ylab = "Total bases of contigs"); dev.off() null device 1 > null device 1 > ++ basename input_1/scaffolds.fasta + outname=scaffolds.fasta + awk '-F\t' 'FILENAME==ARGV[1]{len[$1]=$2} FILENAME!=ARGV[1]{bases[$1]+=$3} END{print "id\tcoverage\tmapped bases\tlength"; for(i in len){if(bases[i]>0){print i"\t"bases[i]/len[i]"\t"bases[i]+0"\t"len[i]}}}' input_1/scaffolds.fasta.fai test_1.fq.sam2.cov test_2.fq.sam2.cov + FUNC_RUN_DOCKER c2997108/ubuntu20:R-2_gplots R --vanilla + PP_RUN_IMAGE=c2997108/ubuntu20:R-2_gplots + shift + PP_RUN_DOCKER_CMD=("${@}") ++ date +%Y%m%d_%H%M%S_%3N + echo 'library(Cairo); a=read.table("scaffolds.fasta.output.txt",header = TRUE,sep="\t",row.names=1); CairoPNG(file="scaffolds.fasta.cov.png",width=1000,height=1000); sunflowerplot(x=a[,1], y=a[,3], xlab="coverage [fold]", ylab="contig length [bp]", log="xy"); dev.off()' + PPDOCNAME=pp20250302_170037_711_1102 + echo pp20250302_170037_711_1102 ++ id -u ++ id -g + docker run --name pp20250302_170037_711_1102 -v /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2:/suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -w /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm c2997108/ubuntu20:R-2_gplots R --vanilla R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. > library(Cairo); a=read.table("scaffolds.fasta.output.txt",header = TRUE,sep="\t",row.names=1); CairoPNG(file="scaffolds.fasta.cov.png",width=1000,height=1000); sunflowerplot(x=a[,1], y=a[,3], xlab="coverage [fold]", ylab="contig length [bp]", log="xy"); dev.off() null device 1 > + awk '-F\t' -v l=0.99 '{cnt[int($2)]+=$4; total+=$4; if(int($2)>max){max=int($2)}} END{for(i=1;i<=max;i++){print i"\t"cnt[i]+0; s+=cnt[i]; if(s>=total*l){print "over_"i"\t"total-s; break}}}' + tail -n+2 scaffolds.fasta.output.txt + echo 'library(Cairo); data=read.table("scaffolds.fasta.output.txt.hist",sep="\t", header = FALSE);colnames(data) <- c("Coverage", "Frequency"); CairoPNG(file="scaffolds.fasta.output.txt.hist.png",width=1000,height=1000); plot(data$Coverage, data$Frequency, type = "o", col = "blue", main = "Coverage Histogram", xlab = "Depth", ylab = "Total bases of contigs"); dev.off()' + FUNC_RUN_DOCKER c2997108/ubuntu20:R-2_gplots R --vanilla + PP_RUN_IMAGE=c2997108/ubuntu20:R-2_gplots + shift + PP_RUN_DOCKER_CMD=("${@}") ++ date +%Y%m%d_%H%M%S_%3N + PPDOCNAME=pp20250302_170038_844_15608 + echo pp20250302_170038_844_15608 ++ id -u ++ id -g + docker run --name pp20250302_170038_844_15608 -v /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2:/suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -w /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm c2997108/ubuntu20:R-2_gplots R --vanilla R version 4.1.2 (2021-11-01) -- "Bird Hippie" Copyright (C) 2021 The R Foundation for Statistical Computing Platform: x86_64-pc-linux-gnu (64-bit) R is free software and comes with ABSOLUTELY NO WARRANTY. You are welcome to redistribute it under certain conditions. Type 'license()' or 'licence()' for distribution details. R is a collaborative project with many contributors. Type 'contributors()' for more information and 'citation()' on how to cite R or R packages in publications. Type 'demo()' for some demos, 'help()' for on-line help, or 'help.start()' for an HTML browser interface to help. Type 'q()' to quit R. > library(Cairo); data=read.table("scaffolds.fasta.output.txt.hist",sep="\t", header = FALSE);colnames(data) <- c("Coverage", "Frequency"); CairoPNG(file="scaffolds.fasta.output.txt.hist.png",width=1000,height=1000); plot(data$Coverage, data$Frequency, type = "o", col = "blue", main = "Coverage Histogram", xlab = "Depth", ylab = "Total bases of contigs"); dev.off() null device 1 > + '[' true = true ']' + cat + for i in *.sam + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 bash run-makebam.sh "test_1.fq.sam" "16"' + for i in *.sam + xargs '-d\n' -I '{}' -P 1 bash -c '{}' + echo 'PPDOCNAME=pp`date +%Y%m%d_%H%M%S_%3N`_$RANDOM; echo $PPDOCNAME >> /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-docker-list; docker run --name ${PPDOCNAME} -v $PWD:$PWD -w $PWD -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 bash run-makebam.sh "test_2.fq.sam" "16"' [bam_sort_core] merging from 0 files and 16 in-memory blocks... [bam_sort_core] merging from 0 files and 16 in-memory blocks... + '[' true = true ']' + FUNC_RUN_DOCKER quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools merge -f scaffolds.fasta.bam test_1.fq.sam.clean.bam test_2.fq.sam.clean.bam + PP_RUN_IMAGE=quay.io/biocontainers/samtools:1.19--h50ea8bc_0 + shift + PP_RUN_DOCKER_CMD=("${@}") ++ date +%Y%m%d_%H%M%S_%3N + PPDOCNAME=pp20250302_170042_655_7513 + echo pp20250302_170042_655_7513 ++ id -u ++ id -g + docker run --name pp20250302_170042_655_7513 -v /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2:/suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -w /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools merge -f scaffolds.fasta.bam test_1.fq.sam.clean.bam test_2.fq.sam.clean.bam + FUNC_RUN_DOCKER quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools index scaffolds.fasta.bam + PP_RUN_IMAGE=quay.io/biocontainers/samtools:1.19--h50ea8bc_0 + shift + PP_RUN_DOCKER_CMD=("${@}") ++ date +%Y%m%d_%H%M%S_%3N + PPDOCNAME=pp20250302_170043_842_11892 + echo pp20250302_170043_842_11892 ++ id -u ++ id -g + docker run --name pp20250302_170043_842_11892 -v /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2:/suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -w /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/samtools:1.19--h50ea8bc_0 samtools index scaffolds.fasta.bam + rm -f test_1.fq.sam test_2.fq.sam test_1.fq.sam2 test_2.fq.sam2 + tail -n+2 + awk '{a+=$5} END{print a}' + sed s/,//g ++ find input_2 -maxdepth 1 ++ egrep '[.]f(ast|)q(|[.]gz)$' + FUNC_RUN_DOCKER quay.io/biocontainers/seqkit:0.12.1--0 seqkit stats input_2/test_1.fq input_2/test_2.fq + PP_RUN_IMAGE=quay.io/biocontainers/seqkit:0.12.1--0 + shift + PP_RUN_DOCKER_CMD=("${@}") ++ date +%Y%m%d_%H%M%S_%3N + PPDOCNAME=pp20250302_170044_760_11789 + echo pp20250302_170044_760_11789 ++ id -u ++ id -g + docker run --name pp20250302_170044_760_11789 -v /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2:/suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -w /suikou/files/m256y/yoshitake.kazutoshi/work/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2 -v /suikou/files/m256y/yoshitake.kazutoshi:/suikou/files/m256y/yoshitake.kazutoshi -u 2007:600 -i --rm quay.io/biocontainers/seqkit:0.12.1--0 seqkit stats input_2/test_1.fq input_2/test_2.fq + tail -n+2 scaffolds.fasta.output.txt + sort -k4,4nr -t ' ' + awk -v n=20 'NR<=n{a+=$2} END{print a/n}' ++ cat temp.txt ++ cat temp2.txt + awk -v total=2000000 -v depth=0.227699 -v n=20 'BEGIN{print "Total bases of input reads: "total" bp"; print "Average depth of the longest "n" contigs: "depth" x"; print "Estimated genome size: "total / depth" bp"}' + rm -f temp.txt temp2.txt + post_processing + '[' 1 = 1 ']' + rm -f /home/yoshitake.kazutoshi/files/m256y/pp-dev/yoshitake/test/post-assemble~coverage-length-graph_by-minimap2/pp-singularity-flag + '[' '' = y ']' + echo 0 + exit