From d7d436c2fa104d29570bad1668b4105ce71f2ec9 Mon Sep 17 00:00:00 2001
From: Laura Cook <l.cook2@student.unimelb.edu.au>
Date: Fri, 11 Sep 2020 12:14:24 +1000
Subject: [PATCH] first commit. script to subsample BAM files in a directory

---
 dunnart/scripts/subsample.sh | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)
 create mode 100644 dunnart/scripts/subsample.sh

diff --git a/dunnart/scripts/subsample.sh b/dunnart/scripts/subsample.sh
new file mode 100644
index 0000000..322a400
--- /dev/null
+++ b/dunnart/scripts/subsample.sh
@@ -0,0 +1,17 @@
+#!/usr/bin/env bash
+# Down-sample every B*_PPq30.sorted.dedup.bam in the current directory to about
+# TARGET_READS mapped reads (default 10000000); same-named BAMs go to OUT_DIR.
+set -euo pipefail
+shopt -s nullglob # an unmatched glob expands to nothing, not to the literal pattern
+TARGET_READS="${TARGET_READS:-10000000}" OUT_DIR="${OUT_DIR:-../../results_10M/bowtie2}"
+bams=(B*_PPq30.sorted.dedup.bam)
+(( ${#bams[@]} )) || { echo "no B*_PPq30.sorted.dedup.bam files in $PWD" >&2; exit 1; }
+TRA=("${bams[@]%_PPq30.sorted.dedup.bam}") # sample prefixes (file name minus the fixed suffix)
+echo "${TRA[@]}"
+mkdir -p -- "$OUT_DIR"
+for tr in "${TRA[@]}"; do
+  echo "$tr"
+  # Sum idxstats column 3 (mapped reads); print a fraction only if the BAM exceeds the target.
+  frac=$(samtools idxstats "${tr}_PPq30.sorted.dedup.bam" | awk -v target="$TARGET_READS" '{ total += $3 } END { f = (total > 0) ? target / total : 1; if (f < 0.9999995) printf "%.6f\n", f }')
+  samtools view -b ${frac:+-s "$frac"} "${tr}_PPq30.sorted.dedup.bam" > "$OUT_DIR/${tr}_PPq30.sorted.dedup.bam" # no -s => keep every read
+done
-- 
GitLab