From 804d89b782e49bf906560c538b775830cb756457 Mon Sep 17 00:00:00 2001
From: Tim O'Donnell <timodonnell@gmail.com>
Date: Sun, 15 Sep 2019 21:41:25 -0400
Subject: [PATCH] Copy training data into new models dir when doing model
 selection

---
 .../models_class1_pan/GENERATE.WITH_HPC_CLUSTER.sh              | 2 ++
 downloads-generation/models_class1_pan/GENERATE.sh              | 2 ++
 2 files changed, 4 insertions(+)

diff --git a/downloads-generation/models_class1_pan/GENERATE.WITH_HPC_CLUSTER.sh b/downloads-generation/models_class1_pan/GENERATE.WITH_HPC_CLUSTER.sh
index 84e040cd..5d21a2e6 100755
--- a/downloads-generation/models_class1_pan/GENERATE.WITH_HPC_CLUSTER.sh
+++ b/downloads-generation/models_class1_pan/GENERATE.WITH_HPC_CLUSTER.sh
@@ -62,6 +62,8 @@ do
         --max-models 32 \
         --num-jobs $NUM_JOBS --max-tasks-per-worker 1 --gpus $GPUS --max-workers-per-gpu 1
 
+    cp "$MODELS_DIR/train_data.csv.bz2" "models.${kind}/"
+
     # Percentile rank calibration is run on the cluster.
     # For now we calibrate percentile ranks only for alleles for which there
     # is training data. Calibrating all alleles would be too slow.
diff --git a/downloads-generation/models_class1_pan/GENERATE.sh b/downloads-generation/models_class1_pan/GENERATE.sh
index 216942dc..a0842d31 100755
--- a/downloads-generation/models_class1_pan/GENERATE.sh
+++ b/downloads-generation/models_class1_pan/GENERATE.sh
@@ -55,6 +55,8 @@ do
         --num-jobs 0 \
         --num-jobs $NUM_JOBS --max-tasks-per-worker 1 --gpus $GPUS --max-workers-per-gpu 1
 
+    cp "$MODELS_DIR/train_data.csv.bz2" "models.${kind}/"
+
     # For now we calibrate percentile ranks only for alleles for which there
     # is training data. Calibrating all alleles would be too slow.
     # This could be improved though.
-- 
GitLab