kornosk
/

bert-political-election2020-twitter-mlm

masked-token-prediction

Inference Endpoints

Model card Files Files and versions Community

kornosk committed on May 10, 2022

Commit

6740229

·

1 Parent(s): 032c5da

Update README.md

Files changed (1) hide show

README.md +9 -6

README.md CHANGED Viewed

@@ -32,30 +32,33 @@ Please see the [official repository](https://github.com/GU-DataLab/stance-detect
 from transformers import BertTokenizer, BertForMaskedLM, pipeline
 import torch
-# choose GPU if available
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-# select mode path here
 pretrained_LM_path = "kornosk/bert-political-election2020-twitter-mlm"
-# load model
 tokenizer = BertTokenizer.from_pretrained(pretrained_LM_path)
 model = BertForMaskedLM.from_pretrained(pretrained_LM_path)
-# fill mask
 example = "Trump is the [MASK] of USA"
 fill_mask = pipeline('fill-mask', model=model, tokenizer=tokenizer)
 outputs = fill_mask(example)
 print(outputs)
-# see embeddings
 inputs = tokenizer(example, return_tensors="pt")
 outputs = model(**inputs)
 print(outputs)
 # OR you can use this model to train on your downstream task!
-# please consider citing our paper if you feel this is useful :)
 ```
 # Reference

 from transformers import BertTokenizer, BertForMaskedLM, pipeline
 import torch
+# Choose GPU if available
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# Select model path here
 pretrained_LM_path = "kornosk/bert-political-election2020-twitter-mlm"
+# Load model
 tokenizer = BertTokenizer.from_pretrained(pretrained_LM_path)
 model = BertForMaskedLM.from_pretrained(pretrained_LM_path)
+# Fill mask
 example = "Trump is the [MASK] of USA"
 fill_mask = pipeline('fill-mask', model=model, tokenizer=tokenizer)
+# Use the following line instead if the one above does not work.
+# Hugging Face Transformers has been updated; newer versions accept the model name as a string instead.
+fill_mask = pipeline('fill-mask', model=pretrained_LM_path, tokenizer=tokenizer)
 outputs = fill_mask(example)
 print(outputs)
+# See embeddings
 inputs = tokenizer(example, return_tensors="pt")
 outputs = model(**inputs)
 print(outputs)
 # OR you can use this model to train on your downstream task!
+# Please consider citing our paper if you find this useful :)
 ```
 # Reference