text-matching / generation.py
Keane Moraes
extracting keywords from texts
232a10d
raw
history blame
645 Bytes
import openai
from utils import *
import mdforest
class Insights:
    """Collect keywords from a piece of (presumably markdown) text.

    On construction the input is cleaned with ``mdforest.clean_markdown``,
    run through ``preprocess`` and split into chunks by
    ``create_nest_sentences``. ``generate_topics`` then runs
    ``generate_keywords`` over each chunk and gathers the results.

    Attributes:
        corpus: Result of ``preprocess(mdforest.clean_markdown(text))``.
        text: Result of ``create_nest_sentences(corpus, EMBEDDING_MAX_TOKENS)``;
            iterated chunk by chunk in ``generate_topics``.
        keywords: Keywords gathered so far; starts out empty.
        model: Object returned by ``load_keyword_model()``, handed to
            ``generate_keywords`` for every chunk.
    """

    # Size limit passed to create_nest_sentences when chunking the corpus.
    # NOTE(review): presumably the token limit of the embedding model in
    # use -- confirm against the helper in utils.
    EMBEDDING_MAX_TOKENS = 8191

    def __init__(self, text: str) -> None:
        """Clean and chunk *text*, then load the keyword model.

        Args:
            text: Raw input document; it is passed to
                ``mdforest.clean_markdown`` before any other processing.
        """
        cleaned = mdforest.clean_markdown(text)
        self.corpus = preprocess(cleaned)
        self.text = create_nest_sentences(self.corpus, self.EMBEDDING_MAX_TOKENS)
        self.keywords = []
        self.model = load_keyword_model()

    def generate_topics(self) -> list:
        """Generate keywords for every chunk and return all keywords so far.

        Keywords are appended to whatever ``self.keywords`` already holds,
        so calling this method repeatedly keeps accumulating results.

        Returns:
            The updated ``self.keywords`` list.
        """
        print("We are here for generating topics")
        # Copy once and extend in place rather than rebuilding the whole
        # list with ``+`` on every iteration. Working on a copy also keeps
        # any list returned by an earlier call untouched, and leaves
        # self.keywords unchanged if a chunk fails midway.
        collected = list(self.keywords)
        for chunk in self.text:
            collected.extend(generate_keywords(self.model, chunk))
        self.keywords = collected
        return self.keywords