Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -8,11 +8,12 @@ from nltk.data import load
|
|
8 |
import streamlit as st
|
9 |
import sklearn
|
10 |
|
|
|
|
|
11 |
def custom_tokenizer_with_Turkish_stemmer(text):
    """Tokenize *text* and return the stem of each lower-cased token.

    Uses the module-level ``tokenizer`` (its ``tokenize`` method) to split
    the text and the module-level ``stemmerTR`` (its ``stem`` method) to
    reduce every token; both objects are defined outside this function.

    Returns:
        A list with one stem per token, in token order.
    """
    words = tokenizer.tokenize(text)
    # Debug output: echoes the raw tokens on every call.
    print(words)
    # NOTE(review): str.lower() is not locale-aware (e.g. "I" -> "i", not
    # the Turkish dotless "ı") — confirm this is the intended casing.
    return [stemmerTR.stem(word.lower()) for word in words]
|
|
|
8 |
import streamlit as st
|
9 |
import sklearn
|
10 |
|
11 |
+
# Deletion table for str.translate: every ASCII punctuation character and
# decimal digit is mapped to None, so translate() drops them from the text.
trans_table = str.maketrans("", "", string.punctuation + string.digits)
|
12 |
+
|
13 |
def custom_tokenizer_with_Turkish_stemmer(text):
    """Strip punctuation/digits from *text*, tokenize it, and stem each token.

    The text is first passed through ``str.translate`` with the module-level
    ``trans_table``, then split with ``nltk.word_tokenize``. Each token is
    lower-cased and reduced with the module-level ``stemmerTR.stem``.

    Returns:
        A list with one stem per token, in token order.
    """
    cleaned = text.translate(trans_table)
    words = list(nltk.word_tokenize(cleaned))
    # Debug output: echoes the raw tokens on every call.
    print(words)
    # NOTE(review): str.lower() is not locale-aware (e.g. "I" -> "i", not
    # the Turkish dotless "ı") — confirm this is the intended casing.
    return [stemmerTR.stem(word.lower()) for word in words]
|