hdallatorre
committed on
Commit
·
8eb8eb4
1
Parent(s):
821d743
Update README.md
Browse files
README.md
CHANGED
@@ -40,6 +40,7 @@ import torch
|
|
40 |
# Import the tokenizer and the model
|
41 |
tokenizer = AutoTokenizer.from_pretrained("InstaDeepAI/nucleotide-transformer-500m-1000g")
|
42 |
model = AutoModelForMaskedLM.from_pretrained("InstaDeepAI/nucleotide-transformer-500m-1000g")
|
|
|
43 |
# Create a dummy dna sequence and tokenize it
|
44 |
sequences = ["ATTCCGATTCCGATTCCG", "ATTTCTCTCTCTCTCTGAGATCGATCGATCGAT"]
|
45 |
tokens_ids = tokenizer.batch_encode_plus(sequences, return_tensors="pt", padding="max_length", max_length = max_length)["input_ids"]
|
|
|
40 |
# Import the tokenizer and the model
|
41 |
tokenizer = AutoTokenizer.from_pretrained("InstaDeepAI/nucleotide-transformer-500m-1000g")
|
42 |
model = AutoModelForMaskedLM.from_pretrained("InstaDeepAI/nucleotide-transformer-500m-1000g")
|
43 |
+
|
44 |
# Create a dummy dna sequence and tokenize it
|
45 |
sequences = ["ATTCCGATTCCGATTCCG", "ATTTCTCTCTCTCTCTGAGATCGATCGATCGAT"]
|
46 |
tokens_ids = tokenizer.batch_encode_plus(sequences, return_tensors="pt", padding="max_length", max_length = max_length)["input_ids"]
|