File size: 1,289 Bytes
ea5c59c
 
 
8d4620d
9ec3b13
ea5c59c
8d4620d
28c51ee
 
8d4620d
 
 
ea5c59c
8d4620d
ea5c59c
1ed0b9b
54f71b8
075ace4
54f71b8
 
 
 
fbb7eab
c1816fd
0ba8479
 
230d178
 
 
 
 
8d4620d
c1816fd
9a0b416
fda22ce
 
 
51b9227
fda22ce
339798f
17f90e8
51b9227
17f90e8
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
import streamlit as st
import pandas as pd
import numpy as np
import os
from grobidmonkey import reader

def save_uploaded_file(uploaded_file) -> str:
    """Write an uploaded file into the local ``./uploads`` directory.

    The client-supplied file name is reduced to its final path component
    before it is used, so a name such as ``../../evil.pdf`` cannot place the
    file outside ``./uploads``.

    Args:
        uploaded_file: Object exposing a ``name`` attribute (str) and a
            ``getbuffer()`` method returning the file's bytes.

    Returns:
        The path of the saved file as a string, of the form
        ``./uploads/<file name>``.

    Raises:
        ValueError: If the name contains no usable file-name component
            (empty, ``.`` or ``..`` after stripping directories).
    """
    upload_dir = "./uploads"

    # The name comes from the client. os.path.basename only splits on the
    # host OS's separator, so normalise backslashes first to strip
    # Windows-style directory parts as well.
    safe_name = os.path.basename(uploaded_file.name.replace("\\", "/"))
    if safe_name in ("", ".", ".."):
        raise ValueError(f"Invalid upload file name: {uploaded_file.name!r}")

    os.makedirs(upload_dir, exist_ok=True)  # Create 'uploads' directory if it doesn't exist
    file_path = os.path.join(upload_dir, safe_name)
    with open(file_path, "wb") as f:
        f.write(uploaded_file.getbuffer())
    return file_path  # Return the file path as a string

st.title('Paper2Slides')

st.subheader('Upload paper in pdf format')

# Two columns with a 3:1 width ratio: the uploader on the left, the
# parsing-method selector on the right.
col1, col2 = st.columns([3, 1])
with col1:
    # Restrict uploads to PDFs, matching the subheader above, so other file
    # types are rejected by the widget instead of being handed to the parser.
    uploaded_file = st.file_uploader("Choose a file", type=["pdf"])
with col2:
    # The selected value is passed on as the reader's parsing method.
    option = st.selectbox(
        'Select parsing method.',
        ('monkey', 'x2d', 'lxml'),
    )

if uploaded_file is not None:
    # Echo the upload's name and size in bytes back to the page.
    st.write(uploaded_file.name)
    bytes_data = uploaded_file.getvalue()
    upload_size = len(bytes_data)
    st.write(upload_size, "bytes")

    # Persist the upload to disk: the reader calls below take a file path.
    saved_file_path = save_uploaded_file(uploaded_file)
    monkeyReader = reader.MonkeyReader(option)

    # Outline: one line per entry, the entry's prefix followed by its name.
    outline = monkeyReader.readOutline(saved_file_path)
    for prefix, _fill, node in outline:
        outline_line = "%s%s" % (prefix, node.name)
        st.write(outline_line)

    # Paper content: each key is shown with its values joined by ", ".
    essay = monkeyReader.readEssay(saved_file_path)
    for heading, texts in essay.items():
        joined_texts = ', '.join(texts)
        st.write(f"{heading}: {joined_texts}")