fix amino acid letter order

20623c17 · Alex Rubinsteyn · e112e7bc · 20623c17 · 20623c17
Commit 20623c17 authored 9 years ago by Alex Rubinsteyn
--- a/mhcflurry/amino_acid.py
+++ b/mhcflurry/amino_acid.py
@@ -35,6 +35,6 @@ amino_acids = {
    "V": "Valine",
 }

-amino_acid_letters = list(amino_acids.keys())
-amino_acid_names = list(amino_acids.values())
+amino_acid_letters = list(sorted(amino_acids.keys()))
+amino_acid_names = [amino_acids[k] for k in amino_acid_letters]
 amino_acid_letter_indices = {c: i for (i, c) in enumerate(amino_acid_letters)}
--- a/mhcflurry/mhc1_binding_predictor.py
+++ b/mhcflurry/mhc1_binding_predictor.py
@@ -64,11 +64,12 @@ class Mhc1BindingPredictor(object):
                    original_allele_name,))

            with open(json_path, "r") as f:
-                json_string = json.load(f)
-            self.model = model_from_config(json_string)
+                config_dict = json.load(f)
+            print(config_dict)
+            self.model = model_from_config(config_dict)
            self.model.load_weights(hdf_path)
-
            _allele_model_cache[self.allele] = self.model
+            self.model.compile(loss="mse", optimizer="rmsprop")
        else:
            self.model = _allele_model_cache[self.allele]

@@ -91,13 +92,16 @@ class Mhc1BindingPredictor(object):
        """
        Predict binding affinity for 9mer peptides
        """
+        print("peptides", peptides)
        if any(len(peptide) != 9 for peptide in peptides):
            raise ValueError("Can only predict 9mer peptides")
        X = index_encoding(peptides, peptide_length=9)
+        print("X_index", X)
        return self.model.predict(X, verbose=False).flatten()

    def _predict_9mer_peptides_ic50(self, peptides):
        log_y = self._predict_9mer_peptides(peptides)
+        print("log_y", log_y)
        return self._log_to_ic50(log_y)

    def predict_peptides(self, peptides):
@@ -112,18 +116,22 @@ class Mhc1BindingPredictor(object):

        for length, group_peptides in groupby(peptides, lambda x: len(x)):
            group_peptides = list(group_peptides)
+            print("-- input", group_peptides)
            expanded_peptides = expand_9mer_peptides(group_peptides, length)
            n_group = len(group_peptides)
            n_expanded = len(expanded_peptides)
            expansion_factor = int(n_expanded / n_group)
            raw_y = self._predict_9mer_peptides(expanded_peptides)
+            print("raw_y", raw_y)
            median_y = np.zeros(n_group)
            # take the median of each group of log(IC50) values
            for i in range(n_group):
                start = i * expansion_factor
                end = (i + 1) * expansion_factor
                median_y[i] = np.median(raw_y[start:end])
+            print("median_y", median_y)
            ic50 = self._log_to_ic50(median_y)
+            print("ic50", ic50)
            results["Allele"].extend([self.allele] * n_group)
            results["Peptide"].extend(group_peptides)
            results["Prediction"].extend(ic50)