KevinHuSh
committed on
Commit
·
c127ae4
1
Parent(s):
cd46bb2
layout refine (#115)
Browse files
- README.md +1 -1
- api/apps/llm_app.py +13 -2
- api/db/services/llm_service.py +3 -1
- deepdoc/vision/layout_recognizer.py +1 -1
- rag/app/naive.py +1 -1
README.md
CHANGED
@@ -18,7 +18,7 @@ If **vm.max_map_count** is not larger than 65535, please run the following comm
|
|
18 |
121:/ragflow# sudo sysctl -w vm.max_map_count=262144
|
19 |
```
|
20 |
However, this change is not persistent and will be reset after a system reboot.
|
21 |
-
To make the change permanent, you need to update the **/etc/sysctl.conf
|
22 |
Add or update the following line in the file:
|
23 |
```bash
|
24 |
vm.max_map_count=262144
|
|
|
18 |
121:/ragflow# sudo sysctl -w vm.max_map_count=262144
|
19 |
```
|
20 |
However, this change is not persistent and will be reset after a system reboot.
|
21 |
+
To make the change permanent, you need to update the **/etc/sysctl.conf**.
|
22 |
Add or update the following line in the file:
|
23 |
```bash
|
24 |
vm.max_map_count=262144
|
api/apps/llm_app.py
CHANGED
@@ -82,8 +82,19 @@ def set_api_key():
|
|
82 |
@login_required
|
83 |
def my_llms():
|
84 |
try:
|
85 |
-
|
86 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
except Exception as e:
|
88 |
return server_error_response(e)
|
89 |
|
|
|
82 |
@login_required
|
83 |
def my_llms():
|
84 |
try:
|
85 |
+
res = {}
|
86 |
+
for o in TenantLLMService.get_my_llms(current_user.id):
|
87 |
+
if o["llm_factory"] not in res:
|
88 |
+
res[o["llm_factory"]] = {
|
89 |
+
"tags": o["tags"],
|
90 |
+
"llm": []
|
91 |
+
}
|
92 |
+
res[o["llm_factory"]]["llm"].append({
|
93 |
+
"type": o["model_type"],
|
94 |
+
"name": o["model_name"],
|
95 |
+
"used_token": o["used_tokens"]
|
96 |
+
})
|
97 |
+
return get_json_result(data=res)
|
98 |
except Exception as e:
|
99 |
return server_error_response(e)
|
100 |
|
api/db/services/llm_service.py
CHANGED
@@ -49,7 +49,9 @@ class TenantLLMService(CommonService):
|
|
49 |
LLMFactories.logo,
|
50 |
LLMFactories.tags,
|
51 |
cls.model.model_type,
|
52 |
-
cls.model.llm_name
|
|
|
|
|
53 |
objs = cls.model.select(*fields).join(LLMFactories, on=(cls.model.llm_factory == LLMFactories.name)).where(
|
54 |
cls.model.tenant_id == tenant_id).dicts()
|
55 |
|
|
|
49 |
LLMFactories.logo,
|
50 |
LLMFactories.tags,
|
51 |
cls.model.model_type,
|
52 |
+
cls.model.llm_name,
|
53 |
+
cls.model.used_tokens
|
54 |
+
]
|
55 |
objs = cls.model.select(*fields).join(LLMFactories, on=(cls.model.llm_factory == LLMFactories.name)).where(
|
56 |
cls.model.tenant_id == tenant_id).dicts()
|
57 |
|
deepdoc/vision/layout_recognizer.py
CHANGED
@@ -100,7 +100,7 @@ class LayoutRecognizer(Recognizer):
|
|
100 |
i += 1
|
101 |
|
102 |
for lt in ["footer", "header", "reference", "figure caption",
|
103 |
-
"table caption", "title", "
|
104 |
findLayout(lt)
|
105 |
|
106 |
# add box to figure layouts which has not text box
|
|
|
100 |
i += 1
|
101 |
|
102 |
for lt in ["footer", "header", "reference", "figure caption",
|
103 |
+
"table caption", "title", "table", "text", "figure", "equation"]:
|
104 |
findLayout(lt)
|
105 |
|
106 |
# add box to figure layouts which has not text box
|
rag/app/naive.py
CHANGED
@@ -101,7 +101,7 @@ def chunk(filename, binary=None, from_page=0, to_page=100000, lang="Chinese", ca
|
|
101 |
d = copy.deepcopy(doc)
|
102 |
if pdf_parser:
|
103 |
d["image"], poss = pdf_parser.crop(ck, need_position=True)
|
104 |
-
add_positions(d, poss
|
105 |
ck = pdf_parser.remove_tag(ck)
|
106 |
tokenize(d, ck, eng)
|
107 |
res.append(d)
|
|
|
101 |
d = copy.deepcopy(doc)
|
102 |
if pdf_parser:
|
103 |
d["image"], poss = pdf_parser.crop(ck, need_position=True)
|
104 |
+
add_positions(d, poss)
|
105 |
ck = pdf_parser.remove_tag(ck)
|
106 |
tokenize(d, ck, eng)
|
107 |
res.append(d)
|