|
from test_sdkbase import TestSdk |
|
from ragflow import RAGFlow |
|
import pytest |
|
from common import API_KEY, HOST_ADDRESS |
|
|
|
|
|
|
|
class TestDataset(TestSdk): |
|
|
|
def test_create_dataset(self): |
|
''' |
|
1. create a kb |
|
2. list the kb |
|
3. get the detail info according to the kb id |
|
4. update the kb |
|
5. delete the kb |
|
''' |
|
|
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
|
|
res = ragflow.create_dataset("kb1") |
|
assert res['code'] == 0 and res['message'] == 'success' |
|
dataset_name = res['data']['dataset_name'] |
|
|
|
def test_list_dataset_success(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
|
|
response = ragflow.list_dataset() |
|
|
|
code, datasets = response |
|
|
|
assert code == 200 |
|
|
|
def test_list_dataset_with_checking_size_and_name(self): |
|
datasets_to_create = ["dataset1", "dataset2", "dataset3"] |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
created_response = [ragflow.create_dataset(name) for name in datasets_to_create] |
|
|
|
real_name_to_create = set() |
|
for response in created_response: |
|
assert 'data' in response, "Response is missing 'data' key" |
|
dataset_name = response['data']['dataset_name'] |
|
real_name_to_create.add(dataset_name) |
|
|
|
status_code, listed_data = ragflow.list_dataset(0, 3) |
|
listed_data = listed_data['data'] |
|
|
|
listed_names = {d['name'] for d in listed_data} |
|
assert listed_names == real_name_to_create |
|
assert status_code == 200 |
|
assert len(listed_data) == len(datasets_to_create) |
|
|
|
def test_list_dataset_with_getting_empty_result(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
datasets_to_create = [] |
|
created_response = [ragflow.create_dataset(name) for name in datasets_to_create] |
|
|
|
real_name_to_create = set() |
|
for response in created_response: |
|
assert 'data' in response, "Response is missing 'data' key" |
|
dataset_name = response['data']['dataset_name'] |
|
real_name_to_create.add(dataset_name) |
|
|
|
status_code, listed_data = ragflow.list_dataset(0, 0) |
|
listed_data = listed_data['data'] |
|
|
|
listed_names = {d['name'] for d in listed_data} |
|
assert listed_names == real_name_to_create |
|
assert status_code == 200 |
|
assert len(listed_data) == 0 |
|
|
|
def test_list_dataset_with_creating_100_knowledge_bases(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
datasets_to_create = ["dataset1"] * 100 |
|
created_response = [ragflow.create_dataset(name) for name in datasets_to_create] |
|
|
|
real_name_to_create = set() |
|
for response in created_response: |
|
assert 'data' in response, "Response is missing 'data' key" |
|
dataset_name = response['data']['dataset_name'] |
|
real_name_to_create.add(dataset_name) |
|
|
|
status_code, listed_data = ragflow.list_dataset(0, 100) |
|
listed_data = listed_data['data'] |
|
|
|
listed_names = {d['name'] for d in listed_data} |
|
assert listed_names == real_name_to_create |
|
assert status_code == 200 |
|
assert len(listed_data) == 100 |
|
|
|
def test_list_dataset_with_showing_one_dataset(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
response = ragflow.list_dataset(0, 1) |
|
code, response = response |
|
datasets = response['data'] |
|
assert len(datasets) == 1 |
|
|
|
def test_list_dataset_failure(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
response = ragflow.list_dataset(-1, -1) |
|
_, res = response |
|
assert "IndexError" in res['message'] |
|
|
|
def test_delete_one_dataset_with_success(self): |
|
|
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
res = ragflow.create_dataset("kb0") |
|
real_dataset_name = res['data']['dataset_name'] |
|
print("name", real_dataset_name) |
|
|
|
result = ragflow.delete_dataset(real_dataset_name) |
|
print(result) |
|
assert result["success"] is True |
|
|
|
def test_delete_dataset_with_not_existing_dataset(self): |
|
ragflow = RAGFlow(API_KEY, HOST_ADDRESS) |
|
res = ragflow.delete_dataset("weird_dataset") |
|
assert res["success"] is False |
|
|
|
|
|
|
|
|