Spaces:

Dragneel
/

Recon

Running

Dragneel committed on Oct 12, 2023

Commit

47f1219

1 Parent(s): 87458e6

Update sentiment.py

Added: Removing URLs from comments

Files changed (1) hide show

sentiment.py CHANGED Viewed

@@ -80,7 +80,7 @@ def get_reddit_results(query):
     try:
         sub = reddit.subreddit('noveltranslations+progressionfantasy')
-        results = sub.search(query, limit=5)
         results_list = list(results)
@@ -98,7 +98,9 @@ def get_reddit_results(query):
 def transform_text(text):
     text = text.lower()
     text = nltk.word_tokenize(text)
@@ -133,9 +135,9 @@ def analyze_comments(results, query):
         for comment in all_comments:
             comment_body = comment.body
-            print(comment_body)
             text = transform_text(comment_body)
-            print(text)
             comments_for_cloud.append(comment_body)
             if text:

     try:
         sub = reddit.subreddit('noveltranslations+progressionfantasy')
+        results = sub.search(query, limit=2)
         results_list = list(results)
 def transform_text(text):
+    url_pattern = re.compile(r'http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]|[!*\\(\\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+')
+    text = url_pattern.sub('', text)
     text = text.lower()
     text = nltk.word_tokenize(text)
         for comment in all_comments:
             comment_body = comment.body
             text = transform_text(comment_body)
             comments_for_cloud.append(comment_body)
             if text: