m3hrdadfi committed on
Commit
d630b49
·
1 Parent(s): 5a1441b

Merge branch 'main' of https://github.com/m3hrdadfi/typo-detector into main

Browse files
Files changed (1) hide show
  1. app.py +12 -3
app.py CHANGED
@@ -1,8 +1,8 @@
1
  import streamlit as st
2
 
3
  import torch
4
- from transformers import pipeline, set_seed
5
- from transformers import AutoTokenizer
6
 
7
  from libs.normalizer import Normalizer
8
  from libs.examples import LANGUAGES, EXAMPLES
@@ -29,13 +29,22 @@ class TypoDetector:
29
  self.task_name = "token-classification"
30
 
31
  self.tokenizer = None
 
 
32
  self.nlp = None
33
  self.normalizer = None
34
 
35
  def load(self):
36
  if not self.debug:
 
37
  self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path)
38
- self.nlp = pipeline(self.task_name, model=self.model_name_or_path, tokenizer=self.model_name_or_path)
 
 
 
 
 
 
39
 
40
  self.normalizer = Normalizer()
41
 
 
1
  import streamlit as st
2
 
3
  import torch
4
+ from transformers import pipeline
5
+ from transformers import AutoConfig, AutoTokenizer, AutoModelForTokenClassification
6
 
7
  from libs.normalizer import Normalizer
8
  from libs.examples import LANGUAGES, EXAMPLES
 
29
  self.task_name = "token-classification"
30
 
31
  self.tokenizer = None
32
+ self.config = None
33
+ self.model = None
34
  self.nlp = None
35
  self.normalizer = None
36
 
37
  def load(self):
38
  if not self.debug:
39
+ self.config = AutoConfig.from_pretrained(self.model_name_or_path)
40
  self.tokenizer = AutoTokenizer.from_pretrained(self.model_name_or_path)
41
+ self.model = AutoModelForTokenClassification.from_pretrained(self.model_name_or_path, config=self.config)
42
+ self.nlp = pipeline(
43
+ self.task_name,
44
+ model=self.model,
45
+ tokenizer=self.tokenizer,
46
+ aggregation_strategy="average"
47
+ )
48
 
49
  self.normalizer = Normalizer()
50