MahmoudNasser
committed on
Commit
·
28ee38b
1
Parent(s):
cb8913f
Update Cleaning.py
Browse files
- Cleaning.py +4 -4
Cleaning.py
CHANGED
@@ -9,9 +9,9 @@ import os
|
|
9 |
import math
|
10 |
import random
|
11 |
|
12 |
-
isristemmer = ISRIStemmer()
|
13 |
-
def stemming(txt):
|
14 |
-
return isristemmer.stem(txt)
|
15 |
|
16 |
|
17 |
def remove_singleCharacter(text):
|
@@ -77,7 +77,7 @@ def Remove_unwanted(text):
|
|
77 |
|
78 |
def txt_preprocess(text):
|
79 |
text = normalize_text(text)
|
80 |
-
text = stemming(text)
|
81 |
text = remove_stopwords(text)
|
82 |
text = remove_punctuations(text)
|
83 |
text = Remove_unwanted(text)
|
|
|
9 |
import math
|
10 |
import random
|
11 |
|
12 |
+
# isristemmer = ISRIStemmer()
|
13 |
+
# def stemming(txt):
|
14 |
+
# return isristemmer.stem(txt)
|
15 |
|
16 |
|
17 |
def remove_singleCharacter(text):
|
|
|
77 |
|
78 |
def txt_preprocess(text):
|
79 |
text = normalize_text(text)
|
80 |
+
# text = stemming(text)
|
81 |
text = remove_stopwords(text)
|
82 |
text = remove_punctuations(text)
|
83 |
text = Remove_unwanted(text)
|