@@ -48,13 +48,10 @@ if [[ ! -f $YGENOME ]]; then
4848 echo " Parsing genome..."
4949 YPARSER=../EpitopeID/utility_scripts/genome_data/parsers/parse_sacCer3_Genome_FASTA.pl
5050 perl $YPARSER S288C_reference_genome_R64-1-1_20110203/S288C_reference_sequence_R64-1-1_20110203.fsa $YGENOME
51- echo " Complete"
5251 echo " BWA Indexing genome..."
5352 bwa index $YGENOME
54- echo " Complete"
5553 echo " Bowtie2 Indexing genome..."
5654 bowtie2-build $YGENOME $YGENOME
57- echo " Complete"
5855 rm S288C_reference_genome_R64-1-1_20110203.tgz
5956 rm -r S288C_reference_genome_R64-1-1_20110203/
6057fi
@@ -76,17 +73,39 @@ if [[ ! -f $HGENOME ]]; then
7673 chmod 777 twoBitToFa
7774 echo " Converting 2bit to fa..."
7875 ./twoBitToFa hg19.2bit $HGENOME .raw
79- echo " Complete"
8076 echo " Strip haplotypes..."
8177 python scripts/parse_hg19_Genome_FASTA.py $HGENOME .raw > $HGENOME
82- echo " Complete"
8378 echo " BWA Indexing genome..."
8479 bwa index $HGENOME
80+ echo " Bowtie2 Indexing genome..."
8581 bowtie2-build $HGENOME $HGENOME
8682 echo " Complete"
8783 rm twoBitToFa hg19.2bit $HGENOME .raw
8884fi
8985
86+
87+ # Download Human Genome (hg38)
88+ HGENOME=input/hg38.fa
89+ if [[ ! -f $HGENOME ]]; then
90+ echo " **Human genome not found, downloading to $HGENOME ..."
91+ wget -N http://hgdownload.cse.ucsc.edu/goldenPath/hg38/bigZips/hg38.2bit
92+ # Check for the existence of twoBitToFa, download if not present and make globally executable
93+ if ! command -v twoBitToFa; then
94+ unameOUT=" $( uname -s) "
95+ if [ $unameOUT == " Darwin" ]; then
96+ wget -N http://hgdownload.soe.ucsc.edu/admin/exe/macOSX.x86_64/twoBitToFa
97+ else
98+ wget -N http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64.v369/twoBitToFa
99+ fi
100+ fi
101+ chmod 777 twoBitToFa
102+ echo " Converting 2bit to fa..."
103+ ./twoBitToFa hg38.2bit $HGENOME
104+ echo " BWA Indexing genome..."
105+ bwa index $HGENOME
106+ rm twoBitToFa hg38.2bit
107+ fi
108+
90109# Build Yeast EpiID with R500
91110YEPIDB=db/sacCer3_EpiID
92111[ -d $YEPIDB ] || cp -r ../EpitopeID/sacCer3_EpiID/ $YEPIDB
@@ -95,10 +114,8 @@ if [ ! -f $YEPIDB/FASTA_genome/genome.fa ]; then
95114 cp input/sacCer3.fa $YEPIDB /FASTA_genome/genome.fa
96115 echo " BWA Indexing genome..."
97116 bwa index $YEPIDB /FASTA_genome/genome.fa
98- echo " Complete"
99117 echo " Bowtie2 Indexing genome..."
100118 bowtie2-build $YEPIDB /FASTA_genome/genome.fa $YEPIDB /FASTA_genome/genome.fa
101- echo " Complete"
102119fi
103120echo " Setup Random Epitope for Yeast EpiID..."
104121cp input/RAND_500.fa $YEPIDB /FASTA_tag/Tag_DB/
@@ -124,7 +141,6 @@ if [ ! -f $HEPIDB/FASTA_genome/genome.fa ]; then
124141 # echo "Complete"
125142 echo " Bowtie2 Indexing genome..."
126143 bowtie2-build $HEPIDB /FASTA_genome/genome.fa $HEPIDB /FASTA_genome/genome.fa
127- echo " Complete"
128144fi
129145echo " Setup Random Epitope for Human EpiID..."
130146cp input/RAND_500.fa $HEPIDB /FASTA_tag/Tag_DB/
@@ -167,9 +183,18 @@ ln -s ../../DeletionID/sacCer3_Del
167183cd $WRK
168184
169185# Add Yeast & Human StrainID DB to paper/db
186+ cd $WRK /../StrainID
187+ tar -xvf hg38_VCF
188+ tar -xvf hg38_ENCODE
189+ cd utility_scripts
190+ bash generate_hg38_VariantDB.#! /bin/sh
191+ mv hg38_DepMap ../
170192cd $WRK /db
171193ln -s ../../StrainID/sacCer3_VCF
172194ln -s ../../StrainID/hg19_VCF
195+ ln -s ../../StrainID/hg38_VCF
196+ ln -s ../../StrainID/hg38_ENCODE
197+ ln -s ../../StrainID/hg38_DepMap
173198cd $WRK
174199
175200# Setup color-space index for yeast genome
0 commit comments