Skip to content
Snippets Groups Projects
Commit 92720e6b authored by Tim O'Donnell's avatar Tim O'Donnell
Browse files

Add data_expression download

parent 0805397e
No related merge requests found
#!/bin/bash
#
# Download published gene expression data corresponding to some of our mass
# spec datasets.
#
#
set -e
set -x
DOWNLOAD_NAME=data_expression
SCRATCH_DIR=${TMPDIR-/tmp}/mhcflurry-downloads-generation
SCRIPT_ABSOLUTE_PATH="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)/$(basename "${BASH_SOURCE[0]}")"
SCRIPT_DIR=$(dirname "$SCRIPT_ABSOLUTE_PATH")
mkdir -p "$SCRATCH_DIR"
rm -rf "$SCRATCH_DIR/$DOWNLOAD_NAME"
mkdir "$SCRATCH_DIR/$DOWNLOAD_NAME"
# Send stdout and stderr to a logfile included with the archive.
exec > >(tee -ia "$SCRATCH_DIR/$DOWNLOAD_NAME/LOG.txt")
exec 2> >(tee -ia "$SCRATCH_DIR/$DOWNLOAD_NAME/LOG.txt" >&2)
date
cd $SCRATCH_DIR/$DOWNLOAD_NAME
# Many cell line sequencing data is available from:
# Available from SRA [access required] at:
# https://www.ebi.ac.uk/ega/studies/EGAS00001000610
# CCLE cell lines
DATASET=ccle
mkdir $DATASET
cd $DATASET
wget -q https://data.broadinstitute.org/ccle/CCLE_RNAseq_rsem_genes_tpm_20180929.txt.gz
wget -q https://data.broadinstitute.org/ccle/CCLE_miRNA_20181103.gct
cd ..
# B721.221
DATASET=b721221
mkdir $DATASET
cd $DATASET
wget -q https://www.ncbi.nlm.nih.gov/geo/download/?acc=GSE93315&format=file
cd ..
DATASET=pancan-xena
mkdir $DATASET
cd $DATASET
wget -q https://pancanatlas.xenahubs.net/download/probeMap/hugo_gencode_good_hg19_V24lift37_probemap
wget -q https://pancanatlas.xenahubs.net/download/EB++AdjustPANCAN_IlluminaHiSeq_RNASeqV2.geneExp.xena.gz
cd ..
cp $SCRIPT_ABSOLUTE_PATH .
bzip2 LOG.txt
RESULT="$SCRATCH_DIR/${DOWNLOAD_NAME}.$(date +%Y%m%d).tar.bz2"
tar -cjf "$RESULT" *
echo "Created archive: $RESULT"
......@@ -37,6 +37,10 @@ releases:
url: https://github.com/openvax/mhcflurry/releases/download/pre-1.4.0/data_mass_spec_annotated.20190930.tar.bz2
default: false
- name: data_expression
url: https://github.com/openvax/mhcflurry/releases/download/1.4.0/data_expression.20191009.tar.bz2
default: false
- name: data_references
url: https://github.com/openvax/mhcflurry/releases/download/pre-1.4.0/data_references.20190927.tar.bz2
default: false
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment