oliverguhr
/

german-sentiment-bert

Text Classification

Inference Endpoints

Model card Files Files and versions Community

oliverguhr committed on Mar 14, 2022

Commit

70e394e

•

1 Parent(s): 2fcb9be

fixed missing attention mask code

Files changed (1) hide show

README.md +5 -8

README.md CHANGED Viewed

@@ -69,16 +69,13 @@ class SentimentModel():
  def predict_sentiment(self, texts: List[str])-> List[str]:
  texts = [self.clean_text(text) for text in texts]
  # Add special tokens takes care of adding [CLS], [SEP], <s>... tokens in the right way for each model.
- input_ids = self.tokenizer(texts, padding=True, truncation=True, add_special_tokens=True)
- input_ids = torch.tensor(input_ids["input_ids"])
  with torch.no_grad():
- logits = self.model(input_ids)
  label_ids = torch.argmax(logits[0], axis=1)
- labels = [self.model.config.id2label[label_id] for label_id in label_ids.tolist()]
- return labels
  def replace_numbers(self,text: str) -> str:
  return text.replace("0"," null").replace("1"," eins").replace("2"," zwei").replace("3"," drei").replace("4"," vier").replace("5"," fünf").replace("6"," sechs").replace("7"," sieben").replace("8"," acht").replace("9"," neun")

  def predict_sentiment(self, texts: List[str])-> List[str]:
  texts = [self.clean_text(text) for text in texts]
  # Add special tokens takes care of adding [CLS], [SEP], <s>... tokens in the right way for each model.
+ encoded = self.tokenizer.batch_encode_plus(texts,padding=True, add_special_tokens=True,truncation=True, return_tensors="pt")
+ encoded = encoded.to(self.device)
  with torch.no_grad():
+ logits = self.model(**encoded)
  label_ids = torch.argmax(logits[0], axis=1)
+ return [self.model.config.id2label[label_id.item()] for label_id in label_ids]
  def replace_numbers(self,text: str) -> str:
  return text.replace("0"," null").replace("1"," eins").replace("2"," zwei").replace("3"," drei").replace("4"," vier").replace("5"," fünf").replace("6"," sechs").replace("7"," sieben").replace("8"," acht").replace("9"," neun")