Add missing protein_seq value so code block works end-to-end
Browse files
The protein_seq value here is based on https://github.com/BiomedSciAI/biomed-multi-alignment/blob/main/mammal/examples/protein_solubility/main_infer.py
Dean Elzinga [email protected]
README.md
CHANGED
@@ -54,6 +54,9 @@ model.eval()
|
|
54 |
# Load Tokenizer
|
55 |
tokenizer_op = ModularTokenizerOp.from_pretrained("ibm/biomed.omics.bl.sm.ma-ted-458m.protein_solubility")
|
56 |
|
|
|
|
|
|
|
57 |
# convert to MAMMAL style
|
58 |
sample_dict = {"protein_seq": protein_seq}
|
59 |
sample_dict = ProteinSolubilityTask.data_preprocessing(
|
|
|
54 |
# Load Tokenizer
|
55 |
tokenizer_op = ModularTokenizerOp.from_pretrained("ibm/biomed.omics.bl.sm.ma-ted-458m.protein_solubility")
|
56 |
|
57 |
+
# protein_seq: amino-acid sequence of a protein (one-letter codes, as found in a FASTA record), used as the model input for predicting its solubility
|
58 |
+
protein_seq = "NLMKRCTRGFRKLGKCTTLEEEKCKTLYPRGQCTCSDSKMNTHSCDCKSC"
|
59 |
+
|
60 |
# convert to MAMMAL style
|
61 |
sample_dict = {"protein_seq": protein_seq}
|
62 |
sample_dict = ProteinSolubilityTask.data_preprocessing(
|