-
Notifications
You must be signed in to change notification settings - Fork 55
/
large_test.sh
executable file
·40 lines (32 loc) · 1.02 KB
/
large_test.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
#!/bin/bash
# This script downloads a full GUIDE-Seq dataset and performs runs the analysis pipeline.
# It should be run from the test directory.
cd large_test
# Create an output directory with a commit id hash suffix
OUTDIR=output.`git log --pretty=format:'%h' -n 1`
mkdir -p $OUTDIR
ln -sf $OUTDIR output
# Install bwa
git clone https://github.com/lh3/bwa.git
cd bwa
git checkout tags/0.7.9a
make
cd ..
PATH=`pwd`/bwa:$PATH
# Install bedtools
git clone https://github.com/arq5x/bedtools2.git
cd bedtools2
git checkout tags/v2.25.0
make
cd ..
PATH=`pwd`/bedtools2/bin:$PATH
# Download test data FASTQs and manifest
wget http://aryee.mgh.harvard.edu/guideseq/data/guideseq_test_fastq.zip
unzip guideseq_test_fastq.zip
# Download the reference genome
wget http://www.broadinstitute.org/ftp/pub/seq/references/Homo_sapiens_assembly19.fasta
# Run analysis pipeline
python ../../guideseq/guideseq.py all -m test_manifest.yaml
# Check that output tables match the reference output
cd output/filtered
md5sum -c ../../reference_output/md5.txt