Spaces: Sleeping
add grobid dependency
Browse files
- Dockerfile +7 -0
- app.py +1 -1
Dockerfile
CHANGED
@@ -8,6 +8,13 @@ COPY ./packages.txt /app/packages.txt
|
|
8 |
RUN apt-get update && xargs -r -a /app/packages.txt apt-get install -y && rm -rf /var/lib/apt/lists/*
|
9 |
RUN pip3 install --no-cache-dir -r /app/requirements.txt
|
10 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
# User
|
12 |
RUN useradd -m -u 1000 user
|
13 |
USER user
|
|
|
8 |
RUN apt-get update && xargs -r -a /app/packages.txt apt-get install -y && rm -rf /var/lib/apt/lists/*
|
9 |
RUN pip3 install --no-cache-dir -r /app/requirements.txt
|
10 |
|
11 |
+
FROM lfoppiano/grobid AS grobid
|
12 |
+
FROM base AS final
|
13 |
+
|
14 |
+
RUN git clone https://github.com/kermitt2/grobid_client_python && \
|
15 |
+
cd grobid_client_python && \
|
16 |
+
python3 setup.py install
|
17 |
+
|
18 |
# User
|
19 |
RUN useradd -m -u 1000 user
|
20 |
USER user
|
app.py
CHANGED
@@ -20,7 +20,7 @@ if uploaded_file is not None:
|
|
20 |
bytes_data = uploaded_file.getvalue()
|
21 |
st.write(len(bytes_data), "bytes")
|
22 |
saved_file_path = save_uploaded_file(uploaded_file)
|
23 |
-
monkeyReader = reader.MonkeyReader('
|
24 |
outline = monkeyReader.readOutline(saved_file_path)
|
25 |
|
26 |
for pre, fill, node in outline:
|
|
|
20 |
bytes_data = uploaded_file.getvalue()
|
21 |
st.write(len(bytes_data), "bytes")
|
22 |
saved_file_path = save_uploaded_file(uploaded_file)
|
23 |
+
monkeyReader = reader.MonkeyReader('lxml')
|
24 |
outline = monkeyReader.readOutline(saved_file_path)
|
25 |
|
26 |
for pre, fill, node in outline:
|