Skip to content
Snippets Groups Projects
Commit ba936075 authored by Tim O'Donnell's avatar Tim O'Donnell
Browse files

fix

parent df5e6b6c
No related branches found
No related tags found
No related merge requests found
......@@ -95,7 +95,7 @@ else
--predictions "$(mhcflurry-downloads path data_mass_spec_benchmark)/predictions/all.mhcflurry.combined" \
--proteome-peptides "$(mhcflurry-downloads path data_mass_spec_benchmark)/proteome_peptides.all.csv.bz2" \
--ppv-multiplier 100 \
--hit-multiplier-to-take 1 \
--hit-multiplier-to-take 2 \
--out "$(pwd)/train_data.csv"
bzip2 -f train_data.csv
fi
......
......@@ -80,9 +80,7 @@ def load_predictions(dirname, result_df=None, columns=None):
manifest_df = manifest_df.loc[manifest_df.col.isin(result_df.columns)]
print("Will load", len(peptides), "peptides and", len(manifest_df), "cols")
for _, row in tqdm.tqdm(manifest_df.iterrows(), total=len(manifest_df)):
for _, row in manifest_df.iterrows():
with open(os.path.join(dirname, row.path), "rb") as fd:
value = numpy.load(fd)['arr_0']
if mask is not None:
......@@ -109,6 +107,9 @@ def run():
print("Subselected to %d monoallelic samples" % hit_df.sample_id.nunique())
hit_df["allele"] = hit_df.hla
hit_df = hit_df.loc[hit_df.allele.str.match("^HLA-[ABC]")]
print("Subselected to %d HLA-A/B/C samples" % hit_df.sample_id.nunique())
if args.exclude_contig:
new_hit_df = hit_df.loc[
hit_df.protein_primary_ensembl_contig.astype(str) !=
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment