-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtest_run.bash
More file actions
executable file
·50 lines (40 loc) · 2.1 KB
/
test_run.bash
File metadata and controls
executable file
·50 lines (40 loc) · 2.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
#!/usr/bin/env bash
REALNAME=$(readlink -f $0)
SCRIPTDIR=$( cd "$( dirname "$REALNAME" )" && pwd )
# Download example data
echo -e "\nDownloading example data\n"
wget --no-check-certificate "https://trna.ucsc.edu/tDRnamer/data/examples/GM12878_AlkB_rep1_merged.fastq.gz"
wget --no-check-certificate "https://trna.ucsc.edu/tDRnamer/data/examples/ExampleSequences.fa"
wget --no-check-certificate "https://trna.ucsc.edu/tDRnamer/data/examples/ExampleNames.txt"
# Download hg38 reference genome sequence
echo -e "\nDownloading reference genome\n"
wget --no-check-certificate "https://trna.ucsc.edu/tDRnamer/data/examples/hg38_primary_assembly.fa.gz"
gzip -d hg38_primary_assembly.fa.gz
# Get tRNA information
echo -e "\nDownloading tRNA data\n"
wget --no-check-certificate "https://gtrnadb.ucsc.edu/genomes/eukaryota/Hsapi38/hg38-tRNAs.tar.gz"
tar xvf hg38-tRNAs.tar.gz
# Create reference database
echo -e "\nCreating reference database\n"
mkdir -p db
"$SCRIPTDIR/create_tDRnamer_db" -d db/hg38 -g hg38_primary_assembly.fa -t hg38-tRNAs-detailed.out -s hg38-tRNAs-detailed.ss -n hg38-tRNAs_name_map.txt -q
# Name tDRs from fastq
echo -e "\nExample Run 1\n"
mkdir -p run1
"$SCRIPTDIR/tDRnamer" -m seq -s GM12878_AlkB_rep1_merged.fastq.gz -d db/hg38 -r euk -o run1/GM12878_AlkB_rep1
# Name tDRs from fasta
echo -e "\nExample Run 2\n"
mkdir -p run2
"$SCRIPTDIR/tDRnamer" -m seq -s ExampleSequences.fa -d db/hg38 -r euk -o run2/ExampleSequences
# Name tDRs from fasta with maximum sensitivity
echo -e "\nExample Run 3\n"
mkdir -p run3
"$SCRIPTDIR/tDRnamer" -m seq -s ExampleSequences.fa -d db/hg38 -r euk --max -o run3/ExampleSequences
# Name tDRs from fasta with nucleotide variations
echo -e "\nExample Run 4\n"
mkdir -p run4
"$SCRIPTDIR/tDRnamer" -m seq -s ExampleSequences.fa -d db/hg38 -r euk --var -o run4/ExampleSequences
# Find tDRs by names
echo -e "\nExample Run 5\n"
mkdir -p run5
"$SCRIPTDIR/tDRnamer" -m name -n ExampleNames.txt -d db/hg38 -r euk -o run5/ExampleNames