-
Notifications
You must be signed in to change notification settings - Fork 62
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #1017 from griffithlab/ref_seq_mouse
Update reference proteome similarity step to work with nonhuman data
- Loading branch information
Showing
8 changed files
with
281 additions
and
27 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
2 changes: 2 additions & 0 deletions
2
.../test_data/calculate_reference_proteome_similarity/Test.all_epitopes.aggregated.mouse.tsv
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
ID E*01:01 G*01:09 Gene AA Change Num Passing Transcripts Best Peptide Best Transcript TSL Allele Pos Prob Pos Num Passing Peptides IC50 MT IC50 WT %ile MT %ile WT RNA Expr RNA VAF Allele Expr RNA Depth DNA VAF Tier Evaluation | ||
22-41920894-41920895-G-C 2 1 ACO2 N1453S 1 KFNPQTDYL ENSMUST00000027032 Not Supported HLA-G*01:09 5 None 3 1262.760 1318.61 0.500 0.6 NA NA NA NA 0.250 Poor Pending |
247 changes: 247 additions & 0 deletions
247
...lculate_reference_proteome_similarity/Test.all_epitopes.aggregated.mouse.tsv.metrics.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,247 @@ | ||
{ | ||
"tumor_purity": null, | ||
"vaf_clonal": 0.571, | ||
"vaf_subclonal": 0.286, | ||
"binding_threshold": 500, | ||
"aggregate_inclusion_binding_threshold": 5000, | ||
"trna_vaf": 0.25, | ||
"trna_cov": 10, | ||
"allele_expr_threshold": 2.5, | ||
"maximum_transcript_support_level": 1, | ||
"percentile_threshold": null, | ||
"allele_specific_binding_thresholds": false, | ||
"mt_top_score_metric": "Best", | ||
"wt_top_score_metric": "Corresponding", | ||
"binding_cutoffs": { | ||
"HLA-E*01:01": 500, | ||
"HLA-G*01:09": 500 | ||
}, | ||
"is_allele_specific_binding_cutoff": { | ||
"HLA-E*01:01": false, | ||
"HLA-G*01:09": false | ||
}, | ||
"allele_specific_anchors": false, | ||
"anchor_contribution_threshold": 0.8, | ||
"22-41920894-41920895-G-C": { | ||
"good_binders": { | ||
"Transcript Set 1": { | ||
"peptides": { | ||
"LLPLLPLLL": { | ||
"ic50s_MT": [ | ||
2551.25, | ||
4778.52001953125 | ||
], | ||
"percentiles_MT": [ | ||
0.1700439453125, | ||
6.80078125 | ||
], | ||
"ic50s_WT": [ | ||
3099.81, | ||
4830.5 | ||
], | ||
"percentiles_WT": [ | ||
0.33, | ||
6.9 | ||
], | ||
"hla_types": [ | ||
"HLA-E*01:01", | ||
"HLA-G*01:09" | ||
], | ||
"mutation_position": "6-7", | ||
"problematic_positions": "None", | ||
"individual_ic50_calls": { | ||
"algorithms": [ | ||
"NetMHC", | ||
"PickPocket" | ||
], | ||
"MT": { | ||
"HLA-E*01:01": [ | ||
6891.60986328125, | ||
2551.25 | ||
], | ||
"HLA-G*01:09": [ | ||
"NA", | ||
4778.52001953125 | ||
] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [ | ||
9234.71, | ||
3099.81 | ||
], | ||
"HLA-G*01:09": [ | ||
"NA", | ||
4830.5 | ||
] | ||
} | ||
}, | ||
"individual_percentile_calls": { | ||
"algorithms": [ | ||
"NetMHC", | ||
"PickPocket" | ||
], | ||
"MT": { | ||
"HLA-E*01:01": [ | ||
0.1700439453125, | ||
1.400390625 | ||
], | ||
"HLA-G*01:09": [ | ||
"NA", | ||
6.80078125 | ||
] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [ | ||
0.33, | ||
2.2 | ||
], | ||
"HLA-G*01:09": [ | ||
"NA", | ||
6.9 | ||
] | ||
} | ||
}, | ||
"individual_el_calls": { | ||
"algorithms": [], | ||
"MT": { | ||
"HLA-E*01:01": [], | ||
"HLA-G*01:09": [] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [], | ||
"HLA-G*01:09": [] | ||
} | ||
}, | ||
"individual_el_percentile_calls": { | ||
"algorithms": [], | ||
"MT": { | ||
"HLA-E*01:01": [], | ||
"HLA-G*01:09": [] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [], | ||
"HLA-G*01:09": [] | ||
} | ||
}, | ||
"wt_peptide": "LLPLLLLLL" | ||
}, | ||
"LLPLLLLLG": { | ||
"ic50s_MT": [ | ||
4676.22998046875, | ||
"X" | ||
], | ||
"percentiles_MT": [ | ||
5.8984375, | ||
"X" | ||
], | ||
"ic50s_WT": [ | ||
38565.12, | ||
"X" | ||
], | ||
"percentiles_WT": [ | ||
81.0, | ||
"X" | ||
], | ||
"hla_types": [ | ||
"HLA-E*01:01", | ||
"HLA-G*01:09" | ||
], | ||
"mutation_position": "3-4", | ||
"problematic_positions": "None", | ||
"individual_ic50_calls": { | ||
"algorithms": [ | ||
"NetMHC", | ||
"PickPocket" | ||
], | ||
"MT": { | ||
"HLA-E*01:01": [ | ||
31981.0703125, | ||
4676.22998046875 | ||
] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [ | ||
42768.73, | ||
38565.12 | ||
] | ||
} | ||
}, | ||
"individual_percentile_calls": { | ||
"algorithms": [ | ||
"NetMHC", | ||
"PickPocket" | ||
], | ||
"MT": { | ||
"HLA-E*01:01": [ | ||
14.0, | ||
5.8984375 | ||
] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [ | ||
60.0, | ||
81.0 | ||
] | ||
} | ||
}, | ||
"individual_el_calls": { | ||
"algorithms": [], | ||
"MT": { | ||
"HLA-E*01:01": [] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [] | ||
} | ||
}, | ||
"individual_el_percentile_calls": { | ||
"algorithms": [], | ||
"MT": { | ||
"HLA-E*01:01": [] | ||
}, | ||
"WT": { | ||
"HLA-E*01:01": [] | ||
} | ||
}, | ||
"wt_peptide": "LPLLLLLLG" | ||
} | ||
}, | ||
"transcripts": [ | ||
"ENST00000233809.4-IGFBP2-L/LLP-20" | ||
], | ||
"transcript_expr": [ | ||
"NA" | ||
], | ||
"tsl": [ | ||
"Not Supported" | ||
], | ||
"biotype": [ | ||
"protein_coding" | ||
], | ||
"transcript_length": [ | ||
325 | ||
], | ||
"transcript_count": 1, | ||
"peptide_count": 2, | ||
"total_expr": 0 | ||
} | ||
}, | ||
"sets": [ | ||
"Transcript Set 1" | ||
], | ||
"transcript_counts": [ | ||
1 | ||
], | ||
"peptide_counts": [ | ||
2 | ||
], | ||
"set_expr": [ | ||
0 | ||
], | ||
"DNA VAF": 0.891, | ||
"RNA VAF": "NA", | ||
"gene_expr": "NA", | ||
"best_peptide_mt": "LLPLLPLLL", | ||
"best_peptide_wt": "LLPLLLLLL", | ||
"best_hla_allele": "HLA-E*01:01" | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -3275,4 +3275,4 @@ | |
"best_peptide_wt": "ATLSRTLLA", | ||
"best_hla_allele": "HLA-E*01:01" | ||
} | ||
} | ||
} |
4 changes: 4 additions & 0 deletions
4
tests/test_data/calculate_reference_proteome_similarity/Test.mouse.fasta
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,4 @@ | ||
>WT.Rp1.ENSMUST00000027032.missense.1453N/S | ||
IAGTLKFNPETDYLTGTDG | ||
>MT.Rp1.ENSMUST00000027032.missense.1453N/S | ||
IAGTLKFNPQTDYLTGTDG |
24 changes: 0 additions & 24 deletions
24
tests/test_data/calculate_reference_proteome_similarity/input.aggregated.tsv
This file was deleted.
Oops, something went wrong.
2 changes: 2 additions & 0 deletions
2
...st_data/calculate_reference_proteome_similarity/output.aggregated.peptide_fasta.mouse.tsv
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
ID E*01:01 G*01:09 Gene AA Change Num Passing Transcripts Best Peptide Best Transcript TSL Allele Pos Prob Pos Num Passing Peptides IC50 MT IC50 WT %ile MT %ile WT RNA Expr RNA VAF Allele Expr RNA Depth DNA VAF Tier Ref Match Evaluation | ||
22-41920894-41920895-G-C 2 1 ACO2 N1453S 1 KFNPQTDYL ENSMUST00000027032 Not Supported HLA-G*01:09 5 None 3 1262.760 1318.61 0.500 0.6 NA NA NA NA 0.250 Poor False Pending |