Reem333 committed on
Commit
524c798
·
verified ·
1 Parent(s): 8e257e5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -14
app.py CHANGED
@@ -12,17 +12,6 @@ longformer_tokenizer = AutoTokenizer.from_pretrained("allenai/longformer-base-40
12
  bert_model = AutoModelForSequenceClassification.from_pretrained("Reem333/BERT")
13
  bert_tokenizer = AutoTokenizer.from_pretrained("google-bert/bert-base-uncased")
14
 
15
- # Function to extract text from PDF
16
- def extract_text_from_pdf(file_path):
17
- text = ''
18
- try:
19
- with fitz.open(file_path) as pdf_document:
20
- for page_number in range(pdf_document.page_count):
21
- page = pdf_document.load_page(page_number)
22
- text += page.get_text()
23
- except Exception as e:
24
- st.error(f"Error reading PDF file: {e}")
25
- return text
26
 
27
  # Function to predict the class of the text using a specified model and tokenizer
28
  def predict_class(text, model, tokenizer):
@@ -64,13 +53,13 @@ with st.sidebar:
64
  st.markdown("## About")
65
  st.markdown('''
66
  This tool classifies paper citations into different levels based on their number of citations.
67
- Powered by Fine-Tuned [Longformer model](https://huggingface.co/REEM-ALRASHIDI/LongFormer-Paper-Citaion-Classifier) and BERT model with custom data.
68
  ''')
69
  st.markdown("### Class Levels:")
70
- st.markdown("- Level 1: Highly cited papers")
71
  st.markdown("- Level 2: Average cited papers")
72
  st.markdown("- Level 3: More cited papers")
73
- st.markdown("- Level 4: Low cited papers")
74
  st.markdown("---")
75
  st.markdown('Tabuk University')
76
 
 
12
  bert_model = AutoModelForSequenceClassification.from_pretrained("Reem333/BERT")
13
  bert_tokenizer = AutoTokenizer.from_pretrained("google-bert/bert-base-uncased")
14
 
 
 
 
 
 
 
 
 
 
 
 
15
 
16
  # Function to predict the class of the text using a specified model and tokenizer
17
  def predict_class(text, model, tokenizer):
 
53
  st.markdown("## About")
54
  st.markdown('''
55
  This tool classifies paper citations into different levels based on their number of citations.
56
+ Powered by Fine-Tuned [Longformer model](https://huggingface.co/Reem333/LongFormer) and BERT model with custom data.
57
  ''')
58
  st.markdown("### Class Levels:")
59
+ st.markdown("- Level 1: Low cited papers")
60
  st.markdown("- Level 2: Average cited papers")
61
  st.markdown("- Level 3: More cited papers")
62
+ st.markdown("- Level 4: Highly cited papers")
63
  st.markdown("---")
64
  st.markdown('Tabuk University')
65