From 402d3176be6b61bece79a2f8d5309f5993a4be13 Mon Sep 17 00:00:00 2001
From: Tim O'Donnell <timodonnell@gmail.com>
Date: Thu, 15 Feb 2018 14:38:52 -0500
Subject: [PATCH] fixes

---
 .../models_class1/generate_hyperparameters.py |  2 +-
 .../models_class1_unselected/GENERATE.sh      |  2 +-
 mhcflurry/class1_affinity_predictor.py        | 17 ++++++------
 mhcflurry/class1_neural_network.py            |  1 +
 mhcflurry/parallelism.py                      | 27 +++++++++++++++++++
 .../train_allele_specific_models_command.py   | 16 +++++------
 ...st_train_allele_specific_models_command.py | 10 ++++---
 7 files changed, 52 insertions(+), 23 deletions(-)

diff --git a/downloads-generation/models_class1/generate_hyperparameters.py b/downloads-generation/models_class1/generate_hyperparameters.py
index 5b1bf5e0..e12f4ef5 100644
--- a/downloads-generation/models_class1/generate_hyperparameters.py
+++ b/downloads-generation/models_class1/generate_hyperparameters.py
@@ -59,7 +59,7 @@ base_hyperparameters = {
     ##########################################
     # TRAINING Data
     ##########################################
-    "train_data": {"subset": "all", "pretrain_min_points": 10000},
+    "train_data": {"subset": "all", "pretrain_min_points": 1000},
 }
 
 grid = []
diff --git a/downloads-generation/models_class1_unselected/GENERATE.sh b/downloads-generation/models_class1_unselected/GENERATE.sh
index c92baa02..ea9ba8a4 100755
--- a/downloads-generation/models_class1_unselected/GENERATE.sh
+++ b/downloads-generation/models_class1_unselected/GENERATE.sh
@@ -46,7 +46,7 @@ time mhcflurry-class1-train-allele-specific-models \
     --out-models-dir models \
     --percent-rank-calibration-num-peptides-per-length 0 \
     --min-measurements-per-allele 75 \
-    --num-jobs $(expr $PROCESSORS \* 2) --gpus $GPUS --max-workers-per-gpu 2 --max-tasks-per-worker 20
+    --num-jobs $(expr $PROCESSORS \* 2) --gpus $GPUS --max-workers-per-gpu 2 --max-tasks-per-worker 50
 
 cp $SCRIPT_ABSOLUTE_PATH .
 bzip2 LOG.txt
diff --git a/mhcflurry/class1_affinity_predictor.py b/mhcflurry/class1_affinity_predictor.py
index 2f0df6b8..01774c3c 100644
--- a/mhcflurry/class1_affinity_predictor.py
+++ b/mhcflurry/class1_affinity_predictor.py
@@ -510,14 +510,15 @@ class Class1AffinityPredictor(object):
         ]
 
         if train_rounds is not None:
-            for round in range(1, train_rounds.max() + 1):
-                round_mask = train_rounds >= round
-                sub_encodable_peptides = EncodableSequences.create(
-                    encodable_peptides.sequences[round_mask])
-                peptides_affinities_inequalities_per_round.append((
-                    sub_encodable_peptides,
-                    affinities[round_mask],
-                    None if inequalities is None else inequalities[round_mask]))
+            for round in sorted(set(train_rounds)):
+                round_mask = train_rounds > round
+                if round_mask.any():
+                    sub_encodable_peptides = EncodableSequences.create(
+                        encodable_peptides.sequences[round_mask])
+                    peptides_affinities_inequalities_per_round.append((
+                        sub_encodable_peptides,
+                        affinities[round_mask],
+                        None if inequalities is None else inequalities[round_mask]))
 
         n_rounds = len(peptides_affinities_inequalities_per_round)
         n_architectures = len(architecture_hyperparameters_list)
diff --git a/mhcflurry/class1_neural_network.py b/mhcflurry/class1_neural_network.py
index c81a3638..6ff042aa 100644
--- a/mhcflurry/class1_neural_network.py
+++ b/mhcflurry/class1_neural_network.py
@@ -758,6 +758,7 @@ class Class1NeuralNetwork(object):
             numpy.array of nM affinity predictions
         """
         use_cache = (
+            self.prediction_cache is not None and
             allele_encoding is None and
             isinstance(peptides, EncodableSequences))
         if use_cache and peptides in self.prediction_cache:
diff --git a/mhcflurry/parallelism.py b/mhcflurry/parallelism.py
index b8ed6466..f4d0d910 100644
--- a/mhcflurry/parallelism.py
+++ b/mhcflurry/parallelism.py
@@ -1,3 +1,5 @@
+import traceback
+import sys
 from multiprocessing import Pool, Queue, cpu_count
 from six.moves import queue
 from multiprocessing.util import Finalize
@@ -98,3 +100,28 @@ def worker_init_entry_point(
         print("Initializing worker: %s" % str(kwargs))
 
     init_function(**kwargs)
+
+
+# Solution suggested in https://bugs.python.org/issue13831
+class WrapException(Exception):
+    """
+    Add traceback info to exception so exceptions raised in worker processes
+    can still show traceback info when re-raised in the parent.
+    """
+    def __init__(self):
+        exc_type, exc_value, exc_tb = sys.exc_info()
+        self.exception = exc_value
+        self.formatted = ''.join(traceback.format_exception(exc_type, exc_value, exc_tb))
+    def __str__(self):
+        return '%s\nOriginal traceback:\n%s' % (Exception.__str__(self), self.formatted)
+
+
+def call_wrapped(function, *args, **kwargs):
+    try:
+        return function(*args, **kwargs)
+    except:
+        raise WrapException()
+
+
+def call_wrapped_kwargs(function, kwargs):
+    return call_wrapped(function, **kwargs)
\ No newline at end of file
diff --git a/mhcflurry/train_allele_specific_models_command.py b/mhcflurry/train_allele_specific_models_command.py
index b21360cf..dddcc8f2 100644
--- a/mhcflurry/train_allele_specific_models_command.py
+++ b/mhcflurry/train_allele_specific_models_command.py
@@ -20,7 +20,8 @@ tqdm.monitor_interval = 0  # see https://github.com/tqdm/tqdm/issues/481
 
 from .class1_affinity_predictor import Class1AffinityPredictor
 from .common import configure_logging, set_keras_backend
-from .parallelism import make_worker_pool, cpu_count
+from .parallelism import (
+    make_worker_pool, cpu_count, call_wrapped, call_wrapped_kwargs)
 from .hyperparameters import HyperparameterDefaults
 from .allele_encoding import AlleleEncoding
 
@@ -327,7 +328,9 @@ def run(argv=sys.argv[1:]):
         random.shuffle(work_items)
 
         results_generator = worker_pool.imap_unordered(
-            train_model_entry_point, work_items, chunksize=1)
+            partial(call_wrapped_kwargs, train_model),
+            work_items,
+            chunksize=1)
 
         unsaved_predictors = []
         last_save_time = time.time()
@@ -361,7 +364,7 @@ def run(argv=sys.argv[1:]):
         # as it goes so no saving is required at the end.
         for _ in tqdm.trange(len(work_items)):
             item = work_items.pop(0)  # want to keep freeing up memory
-            work_predictor = train_model_entry_point(item)
+            work_predictor = train_model(**item)
             assert work_predictor is predictor
         assert not work_items
 
@@ -418,14 +421,13 @@ def run(argv=sys.argv[1:]):
 
             results = worker_pool.imap_unordered(
                 partial(
-                    calibrate_percentile_ranks,
+                    partial(call_wrapped, calibrate_percentile_ranks),
                     predictor=predictor),
                 alleles,
                 chunksize=1)
             for result in tqdm.tqdm(results, total=len(alleles)):
                 predictor.allele_to_percent_rank_transform.update(result)
-
             print("Done calibrating %d additional alleles."
                   % len(alleles))
 
         predictor.save(args.out_models_dir, model_names_to_write=[])
@@ -440,10 +442,6 @@ def run(argv=sys.argv[1:]):
     print("Predictor written to: %s" % args.out_models_dir)
 
 
-def train_model_entry_point(item):
-    return train_model(**item)
-
-
 def alleles_by_similarity(allele):
     global GLOBAL_DATA
     allele_similarity = GLOBAL_DATA['allele_similarity_matrix']
diff --git a/test/test_train_allele_specific_models_command.py b/test/test_train_allele_specific_models_command.py
index 12fcaa3d..fab19ce7 100644
--- a/test/test_train_allele_specific_models_command.py
+++ b/test/test_train_allele_specific_models_command.py
@@ -2,10 +2,10 @@ import json
 import os
 import shutil
 import tempfile
+import subprocess
 
 from numpy.testing import assert_array_less, assert_equal
 
-from mhcflurry import train_allele_specific_models_command
 from mhcflurry import Class1AffinityPredictor
 from mhcflurry.downloads import get_path
 
@@ -57,6 +57,7 @@ def run_and_check(n_jobs=0):
         json.dump(HYPERPARAMETERS, fd)
 
     args = [
+        "mhcflurry-class1-train-allele-specific-models",
         "--data", get_path("data_curated", "curated_training_data.no_mass_spec.csv.bz2"),
         "--hyperparameters", hyperparameters_filename,
         "--allele", "HLA-A*02:01", "HLA-A*01:01", "HLA-A*03:01",
@@ -66,7 +67,7 @@ def run_and_check(n_jobs=0):
         "--ignore-inequalities",
     ]
     print("Running with args: %s" % args)
-    train_allele_specific_models_command.run(args)
+    subprocess.check_call(args)
 
     result = Class1AffinityPredictor.load(models_dir)
     predictions = result.predict(
@@ -84,8 +85,9 @@ def run_and_check(n_jobs=0):
     shutil.rmtree(models_dir)
 
 
-def Xtest_run_parallel():
-    run_and_check(n_jobs=3)
+if os.environ.get("KERAS_BACKEND") != "theano":
+    def test_run_parallel():
+        run_and_check(n_jobs=3)
 
 
 def test_run_serial():
-- 
GitLab
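
Reviewer note, not part of the patch: the new call_wrapped / call_wrapped_kwargs
helpers exist because multiprocessing re-raises worker exceptions in the parent
with only the parent-side traceback, which makes failures inside train_model hard
to localize. A minimal sketch of the pattern follows, assuming only WrapException
and call_wrapped_kwargs from the patched mhcflurry.parallelism; failing_task and
its arguments are hypothetical stand-ins, not functions from the patch.

    from functools import partial
    from multiprocessing import Pool

    from mhcflurry.parallelism import call_wrapped_kwargs

    def failing_task(allele, n_models):
        # Hypothetical stand-in for train_model in
        # train_allele_specific_models_command.py.
        raise ValueError("error in worker for %s" % allele)

    if __name__ == "__main__":
        work_items = [{"allele": "HLA-A*02:01", "n_models": 1}]
        pool = Pool(2)
        try:
            # Mirrors the patched call site: each kwargs dict is routed
            # through call_wrapped_kwargs, so any worker exception is
            # re-raised as a WrapException carrying the formatted
            # worker-side traceback.
            for _ in pool.imap_unordered(
                    partial(call_wrapped_kwargs, failing_task),
                    work_items,
                    chunksize=1):
                pass
        except Exception as exc:
            # str(exc) includes "Original traceback:" plus the stack
            # captured in the worker via sys.exc_info().
            print(exc)
        finally:
            pool.close()
            pool.join()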
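A second note, on the Class1AffinityPredictor hunk: the old loop iterated
range(1, train_rounds.max() + 1) and masked with >=, while the new loop iterates
the distinct round values, masks with a strict >, and skips empty masks. A toy
numpy illustration of the masking alone (the EncodableSequences plumbing is
omitted and the example array is invented):

    import numpy

    train_rounds = numpy.array([0, 0, 1, 2])

    subsets = []
    for round in sorted(set(train_rounds)):
        round_mask = train_rounds > round
        if round_mask.any():
            subsets.append(numpy.where(round_mask)[0])

    # Two non-empty subsets survive: indices [2, 3] (points after round 0)
    # and [3] (points after round 1); the empty mask for round 2 is skipped.
    print(subsets)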