com3dian committed on
Commit
47c4ff1
·
1 Parent(s): ca45513

add grobid dependency

Browse files
Files changed (2) hide show
  1. Dockerfile +7 -0
  2. app.py +1 -1
Dockerfile CHANGED
@@ -8,6 +8,13 @@ COPY ./packages.txt /app/packages.txt
8
  RUN apt-get update && xargs -r -a /app/packages.txt apt-get install -y && rm -rf /var/lib/apt/lists/*
9
  RUN pip3 install --no-cache-dir -r /app/requirements.txt
10
 
 
 
 
 
 
 
 
11
  # User
12
  RUN useradd -m -u 1000 user
13
  USER user
 
8
  RUN apt-get update && xargs -r -a /app/packages.txt apt-get install -y && rm -rf /var/lib/apt/lists/*
9
  RUN pip3 install --no-cache-dir -r /app/requirements.txt
10
 
11
+ FROM lfoppiano/grobid AS grobid
12
+ FROM base AS final
13
+
14
+ RUN git clone https://github.com/kermitt2/grobid_client_python && \
15
+ cd grobid_client_python && \
16
+ python3 setup.py install
17
+
18
  # User
19
  RUN useradd -m -u 1000 user
20
  USER user
app.py CHANGED
@@ -20,7 +20,7 @@ if uploaded_file is not None:
20
  bytes_data = uploaded_file.getvalue()
21
  st.write(len(bytes_data), "bytes")
22
  saved_file_path = save_uploaded_file(uploaded_file)
23
- monkeyReader = reader.MonkeyReader('monkey')
24
  outline = monkeyReader.readOutline(saved_file_path)
25
 
26
  for pre, fill, node in outline:
 
20
  bytes_data = uploaded_file.getvalue()
21
  st.write(len(bytes_data), "bytes")
22
  saved_file_path = save_uploaded_file(uploaded_file)
23
+ monkeyReader = reader.MonkeyReader('lxml')
24
  outline = monkeyReader.readOutline(saved_file_path)
25
 
26
  for pre, fill, node in outline: