#!/usr/bin/env bash
# mouse/scripts/subsample.sh
#
# Down-sample every *_q30.sorted.dedup.bam file in the current directory to
# (approximately) a fixed number of reads and write the result, under the same
# file name, into the output directory.
#
# Usage: run from the directory that holds the BAM files.
#
# Optional environment overrides:
#   SUBSAMPLE_TARGET_READS  number of reads to keep (default: 10000000)
#   SUBSAMPLE_OUT_DIR       output directory (default: ../../results_10M/bwa)
#
# Exit status: 0 on success, 1 if there is nothing to process or a step fails.

# `set -e` is deliberately not used: every step that matters is checked
# explicitly, and main reports failure through its return status.
set -uo pipefail

#######################################
# Turn per-reference read counts into a sampling fraction.
# Arguments: $1 - target number of reads to keep
# Inputs:    stdin - one read count per line
# Outputs:   "1" when the counts sum to no more than the target (nothing has
#            to be dropped; this also covers an empty or all-zero input, which
#            would otherwise divide by zero), else target/total in fixed-point
#            notation so a tiny fraction is never printed as e.g. "1e-05".
#######################################
subsample_fraction() {
  local target=$1
  awk -v target="$target" '
    { total += $1 }
    END {
      if (total <= target) {
        print 1
      } else {
        printf "%.8f\n", target / total
      }
    }'
}

#######################################
# Subsample every matching BAM in the current directory.
# Globals:   SUBSAMPLE_TARGET_READS, SUBSAMPLE_OUT_DIR (read, optional)
# Outputs:   the list of sample names, then each name as it is processed,
#            on stdout; diagnostics on stderr
# Returns:   0 on success, 1 on any failure
#######################################
main() {
  local -r suffix='_q30.sorted.dedup.bam'
  local target=${SUBSAMPLE_TARGET_READS:-10000000}
  local out_dir=${SUBSAMPLE_OUT_DIR:-../../results_10M/bwa}
  local -a samples=()
  local -a view_args=()
  local bam sample frac out

  if ! [[ "$target" =~ ^[1-9][0-9]*$ ]]; then
    printf 'subsample: target read count must be a positive integer, got "%s"\n' \
      "$target" >&2
    return 1
  fi

  # Derive the sample name by stripping the known suffix, so names with any
  # number of underscores work. The -e test skips the literal pattern that the
  # shell leaves behind when nothing matches.
  for bam in *"${suffix}"; do
    [[ -e "$bam" ]] || continue
    samples+=("${bam%"${suffix}"}")
  done

  if (( ${#samples[@]} == 0 )); then
    printf 'subsample: no *%s files found in %s\n' "$suffix" "$PWD" >&2
    return 1
  fi

  if ! command -v samtools >/dev/null; then
    printf 'subsample: samtools not found in PATH\n' >&2
    return 1
  fi

  if ! mkdir -p -- "$out_dir"; then
    printf 'subsample: cannot create output directory %s\n' "$out_dir" >&2
    return 1
  fi

  printf '%s\n' "${samples[*]}"

  for sample in "${samples[@]}"; do
    printf '%s\n' "$sample"
    bam=${sample}${suffix}
    out=${out_dir}/${bam}

    # Column 3 of `samtools idxstats` is summed to get the file's read total.
    if ! frac=$(samtools idxstats "$bam" | cut -f3 | subsample_fraction "$target"); then
      printf 'subsample: could not count reads in %s\n' "$bam" >&2
      return 1
    fi

    # When the file is already at or below the target, copy every read and do
    # not pass -s at all: a bare "1" is not a usable fraction for
    # `samtools view -s`.
    view_args=(-b)
    if [[ "$frac" != 1 ]]; then
      view_args+=(-s "$frac")
    fi

    if ! samtools view "${view_args[@]}" "$bam" > "$out"; then
      printf 'subsample: samtools view failed for %s\n' "$bam" >&2
      # Do not leave a truncated BAM behind for downstream steps to pick up.
      rm -f -- "$out"
      return 1
    fi
  done
}

main "$@"