Pclanglais committed on
Commit
69f42d1
·
verified ·
1 Parent(s): 14fafd9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -12
app.py CHANGED
@@ -25,8 +25,6 @@ bibliography_classifier = pipeline(
25
  "token-classification", model=bibliography_model, aggregation_strategy="simple", device=device
26
  )
27
 
28
- style_classifier = pipeline("text-classification", model=bibliography_style, tokenizer=tokenizer, device=device)
29
-
30
  # Helper functions
31
  def preprocess_text(text):
32
  text = re.sub(r'<[^>]+>', '', text)
@@ -179,8 +177,8 @@ class CombinedProcessor:
179
  print(entry)
180
  entry = re.sub(r'- ?[\n¶] ?', r'', entry)
181
  entry = re.sub(r' ?[\n¶] ?', r' ', entry)
182
- style = pd.DataFrame(style_classifier(entry, truncation=True, padding=True, top_k=1))
183
- list_style.append(style)
184
  entry = re.sub(r'\s*([;:,\.])\s*', r' \1 ', entry)
185
  #print(entry)
186
  bib_out = bibliography_classifier(entry)
@@ -207,18 +205,19 @@ class CombinedProcessor:
207
  bibtex_entry = create_bibtex_entry(bibtex_data)
208
  bibtex_entries.append(bibtex_entry)
209
 
210
- list_style = pd.concat(list_style)
211
- list_style = list_style.groupby('label')['score'].mean().sort_values(ascending=False).reset_index()
212
- top_style = list_style.iloc[0]['label']
213
- top_style_score = list_style.iloc[0]['score']
214
 
215
  # Create the style information string
216
- style_info = f"Top bibliography style: {top_style} (Mean score: {top_style_score:.6f})"
217
 
218
  # Join BibTeX entries
219
  bibtex_content = "\n\n".join(bibtex_entries)
220
 
221
- return style_info, bibtex_content
 
222
 
223
  # Create the processor instance
224
  processor = CombinedProcessor()
@@ -228,13 +227,12 @@ with gr.Blocks(theme='JohnSmith9982/small_and_pretty') as demo:
228
  gr.HTML("""<h1 style="text-align:center">Reversed Zotero</h1>""")
229
  text_input = gr.Textbox(label="Your text", type="text", lines=10)
230
  text_button = gr.Button("Process Text")
231
- style_output = gr.Textbox(label="Top Style", lines=2)
232
  bibtex_output = gr.Textbox(label="BibTeX Entries", lines=15)
233
 
234
  export_button = gr.Button("Export BibTeX")
235
  export_output = gr.File(label="Exported BibTeX File")
236
 
237
- text_button.click(processor.process, inputs=text_input, outputs=[style_output, bibtex_output])
238
  export_button.click(save_bibtex, inputs=[bibtex_output], outputs=[export_output])
239
 
240
  if __name__ == "__main__":
 
25
  "token-classification", model=bibliography_model, aggregation_strategy="simple", device=device
26
  )
27
 
 
 
28
  # Helper functions
29
  def preprocess_text(text):
30
  text = re.sub(r'<[^>]+>', '', text)
 
177
  print(entry)
178
  entry = re.sub(r'- ?[\n¶] ?', r'', entry)
179
  entry = re.sub(r' ?[\n¶] ?', r' ', entry)
180
+ #style = pd.DataFrame(style_classifier(entry, truncation=True, padding=True, top_k=1))
181
+ #list_style.append(style)
182
  entry = re.sub(r'\s*([;:,\.])\s*', r' \1 ', entry)
183
  #print(entry)
184
  bib_out = bibliography_classifier(entry)
 
205
  bibtex_entry = create_bibtex_entry(bibtex_data)
206
  bibtex_entries.append(bibtex_entry)
207
 
208
+ #list_style = pd.concat(list_style)
209
+ #list_style = list_style.groupby('label')['score'].mean().sort_values(ascending=False).reset_index()
210
+ #top_style = list_style.iloc[0]['label']
211
+ #top_style_score = list_style.iloc[0]['score']
212
 
213
  # Create the style information string
214
+ #style_info = f"Top bibliography style: {top_style} (Mean score: {top_style_score:.6f})"
215
 
216
  # Join BibTeX entries
217
  bibtex_content = "\n\n".join(bibtex_entries)
218
 
219
+ #return style_info, bibtex_content
220
+ return bibtex_content
221
 
222
  # Create the processor instance
223
  processor = CombinedProcessor()
 
227
  gr.HTML("""<h1 style="text-align:center">Reversed Zotero</h1>""")
228
  text_input = gr.Textbox(label="Your text", type="text", lines=10)
229
  text_button = gr.Button("Process Text")
 
230
  bibtex_output = gr.Textbox(label="BibTeX Entries", lines=15)
231
 
232
  export_button = gr.Button("Export BibTeX")
233
  export_output = gr.File(label="Exported BibTeX File")
234
 
235
+ text_button.click(processor.process, inputs=text_input, outputs=[bibtex_output])
236
  export_button.click(save_bibtex, inputs=[bibtex_output], outputs=[export_output])
237
 
238
  if __name__ == "__main__":