-
Notifications
You must be signed in to change notification settings - Fork 79
/
prepare-test-data.sh
executable file
·64 lines (55 loc) · 1.5 KB
/
prepare-test-data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
#!/bin/bash
set -e
set -o pipefail
#######################################
# Alternative to Linux `readlink -f` (originally written for Mac OS X).
# Follows a (possible) chain of symlinks starting at the given path and
# prints the physical directory of the final target joined with the
# target's base name.
# Arguments: $1 - path to resolve; may itself be a symlink
# Outputs:   the resolved path on stdout
# Returns:   non-zero when a directory along the chain cannot be entered
#            or a link cannot be read
# Note:      changes the working directory of the shell it runs in, so
#            call it inside a command substitution, e.g.
#            "$(readlinkUniversal "$0")", to leave the caller's cwd alone.
#######################################
function readlinkUniversal() {
  local targetFile=$1
  local phys_dir

  # CDPATH is emptied and cd's stdout discarded: a user-defined CDPATH could
  # otherwise redirect a relative lookup and print the chosen directory,
  # which would end up inside the captured result.
  CDPATH= cd -- "$(dirname -- "$targetFile")" >/dev/null || return 1
  targetFile=$(basename -- "$targetFile")

  # iterate down a (possible) chain of symlinks
  while [ -L "$targetFile" ]; do
    targetFile=$(readlink -- "$targetFile") || return 1
    CDPATH= cd -- "$(dirname -- "$targetFile")" >/dev/null || return 1
    targetFile=$(basename -- "$targetFile")
  done

  # compute the canonicalized name by finding the physical path
  # for the directory we're in and appending the target file.
  phys_dir=$(pwd -P) || return 1

  # Strip a trailing slash so a target located in "/" is printed as "/name"
  # rather than "//name"; printf keeps whitespace in the path intact.
  printf '%s\n' "${phys_dir%/}/$targetFile"
}
# Work out the directory that contains this script. Linux uses
# `readlink -f`; Darwin and FreeBSD go through readlinkUniversal instead.
# Any other `uname` value aborts the script with status 1.
dir=""
os=$(uname)
case "$os" in
  Linux)
    dir="$(dirname "$(readlink -f "$0")")"
    ;;
  Darwin | FreeBSD)
    dir=$(dirname "$(readlinkUniversal "$0")")
    ;;
  *)
    echo "Unknown OS."
    exit 1
    ;;
esac
# Only the "unit" mode needs pre-processed data; for any other first
# argument report that the step was skipped and finish successfully.
if [[ "${1}" != "unit" ]]; then
  echo "Data pre-processing skipped for: ${1}"
  exit 0
fi

cd "$dir/src/test/resources/sequences/big/"
cd yf_sample_data

# Sample name prefixes handed to parallel after ":::"; each one is
# substituted for "{}" in the command template below.
samples=(Ig-2_S2 Ig-3_S3 Ig-4_S4 Ig-5_S5 Ig1_S1 Ig2_S2 Ig3_S3 Ig4_S4 Ig5_S5)

# Arguments passed to the mixcr launcher for every sample.
analyze_args=(
  -Xmx500m analyze generic-bcr-amplicon -f
  --species hs
  --rna
  --floating-left-alignment-boundary
  --floating-right-alignment-boundary C
  --add-step assembleContigs
  --split-clones-by V --split-clones-by J --split-clones-by C
  -M assemble.sortBySequence=true
  --assemble-clonotypes-by CDR3
  --impute-germline-on-export
)

# Run the analysis for all samples through GNU parallel (-j5), tagging each
# job's output via --tagstring.
parallel --tagstring "{/.}" -j5 "${dir}/mixcr" "${analyze_args[@]}" \
  "{}_L001_R1.fastq.gz" "{}_L001_R2.fastq.gz" "{}" ::: "${samples[@]}"