Skip to content
Snippets Groups Projects
Commit 3b83c2bd authored by Alex Rubinsteyn's avatar Alex Rubinsteyn
Browse files

filter modified peptides from generated dataset

parent 5976e85e
No related branches found
No related tags found
No related merge requests found
__version__ = "0.0.6"
__version__ = "0.0.7"
......@@ -168,6 +168,15 @@ if __name__ == "__main__":
# Assemble the combined dataset, one row per measurement.
combined_df = pd.DataFrame(
    combined_columns,
    columns=["species", "mhc", "peptide", "peptide_length", "meas"])

# Filter out peptides with post-translational modifications, identified here
# by a literal "+" in the peptide string.
# NOTE(review): the intent also mentions peptides with unknown residues, but
# only "+" is checked -- confirm whether another marker should be filtered.
#
# regex=False is required: str.contains interprets its pattern as a regular
# expression by default, and a bare "+" is not a valid regex (it raises
# "nothing to repeat"), so the literal match must be requested explicitly.
modified_peptide_mask = combined_df.peptide.str.contains("+", regex=False)
n_modified = modified_peptide_mask.sum()
if n_modified > 0:
    print("Dropping %d modified peptides" % n_modified)
    combined_df = combined_df[~modified_peptide_mask]

# Report how many new entries were collected per allele, most frequent first.
print("New entry allele distribution")
for (allele, count) in new_allele_counts.most_common():
    print("%s: %d" % (allele, count))
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment