From beb4d69de2d46b611bf918cc8c2c4558e4cacc33 Mon Sep 17 00:00:00 2001 From: Tim O'Donnell <timodonnell@gmail.com> Date: Mon, 19 Feb 2018 14:42:02 -0500 Subject: [PATCH] Include IEDB mass spec in mass spec curated training data --- downloads-generation/data_curated/GENERATE.sh | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/downloads-generation/data_curated/GENERATE.sh b/downloads-generation/data_curated/GENERATE.sh index 11eb52ce..e2ba9187 100755 --- a/downloads-generation/data_curated/GENERATE.sh +++ b/downloads-generation/data_curated/GENERATE.sh @@ -39,8 +39,6 @@ time python curate.py \ --out-csv curated_training_data.no_mass_spec.csv # With mass-spec data -# Note that we STILL drop mass-spec data from IEDB here, since this data seems -# low-quality. time python curate.py \ --data-iedb \ "$(mhcflurry-downloads path data_iedb)/mhc_ligand_full.csv.bz2" \ @@ -50,6 +48,7 @@ time python curate.py \ "$(mhcflurry-downloads path data_systemhcatlas)/data.csv.bz2" \ --data-abelin-mass-spec \ "$(mhcflurry-downloads path data_published)/abelin2017.hits.csv.bz2" \ + --include-iedb-mass-spec \ --out-csv curated_training_data.with_mass_spec.csv bzip2 curated_training_data.no_mass_spec.csv -- GitLab