Vipul-Chauhan committed on
Commit
939efdd
·
1 Parent(s): 0525d89

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -0
app.py CHANGED
@@ -2,6 +2,8 @@
2
  import pandas as pd
3
  newsdf_sample = pd.read_excel("200_sample_each_20newsgroup_4k_tfidf.xlsx",engine="openpyxl")
4
 
 
 
5
  #preprocessing for better tokenization (needed for tfidf)
6
  import nltk
7
  nltk.download('stopwords')
 
2
  import pandas as pd
3
  newsdf_sample = pd.read_excel("200_sample_each_20newsgroup_4k_tfidf.xlsx",engine="openpyxl")
4
 
5
+ print("file size",len(newsdf_sample))
6
+
7
  #preprocessing for better tokenization (needed for tfidf)
8
  import nltk
9
  nltk.download('stopwords')