akuysal committed on
Commit
c83f950
·
1 Parent(s): 8afa1c0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -3,12 +3,15 @@ from TurkishStemmer import TurkishStemmer
3
  import string
4
  # import for loading python objects (scikit-learn models)
5
  import pickle
 
6
  import streamlit as st
7
  import sklearn
8
 
9
  def custom_tokenizer_with_Turkish_stemmer(text):
10
  # tokenize text
11
- tokens = text.split(" ")
 
 
12
  stems = [stemmerTR.stem(item.lower()) for item in tokens]
13
  return stems
14
 
 
3
  import string
4
  # import for loading python objects (scikit-learn models)
5
  import pickle
6
+ import tokenize
7
  import streamlit as st
8
  import sklearn
9
 
10
  def custom_tokenizer_with_Turkish_stemmer(text):
11
  # tokenize text
12
+ # tokens = text.split(" ")
13
+ tokens = tokenize.tokenize(text)
14
+ print(tokens)
15
  stems = [stemmerTR.stem(item.lower()) for item in tokens]
16
  return stems
17