2025-07-04 18:26:36 +08:00
|
|
|
from ragflow_sdk import RAGFlow
|
|
|
|
|
2025-07-05 11:36:29 +08:00
|
|
|
#api_key = "ragflow-I5ZDNjMWNhNTdlMjExZjBiOTEwMzI0ZT"
|
|
|
|
#base_url = "http://192.168.107.165:8099"
|
|
|
|
base_url = "http://localhost"
|
|
|
|
api_key = "ragflow-MyMjM2ODE2NThlMTExZjBiMzJlNzY5Mj"
|
2025-07-04 18:26:36 +08:00
|
|
|
|
|
|
|
rag_object = RAGFlow(api_key=api_key, base_url=base_url)
|
|
|
|
#dataset = rag_object.create_dataset(name="kb_1")
|
|
|
|
|
2025-07-05 11:36:29 +08:00
|
|
|
datasets = rag_object.list_datasets()
|
|
|
|
#dataset = rag_object.list_datasets(name="kb_1")
|
|
|
|
dataset = rag_object.list_datasets(name="制度")
|
2025-07-04 18:26:36 +08:00
|
|
|
|
|
|
|
dataset = dataset[0]
|
|
|
|
|
|
|
|
# filename1 = "ragflow.txt"
|
|
|
|
# blob = open(filename1 , "rb").read()
|
|
|
|
# dataset.upload_documents([{"display_name":filename1,"blob":blob}])
|
2025-07-05 11:36:29 +08:00
|
|
|
# for doc in dataset.list_documents( page=0, page_size=12):
|
|
|
|
# print(doc)
|
|
|
|
# print("=========================================")
|
2025-07-04 18:26:36 +08:00
|
|
|
|
|
|
|
|
2025-07-05 11:36:29 +08:00
|
|
|
doc = dataset.list_documents(name= '科技创新管理办法(试行).pdf')
|
2025-07-04 18:26:36 +08:00
|
|
|
doc = doc[0]
|
2025-07-05 11:36:29 +08:00
|
|
|
# doc.update({"parser_config": {"chunk_token_count": 256}})
|
|
|
|
file_path ="G:\\11\\ragflow_api_test\\1.txt"
|
|
|
|
with open(file_path, 'r', encoding='utf-8') as file:
|
|
|
|
file_content = file.read()
|
|
|
|
for num,txt_chunk in enumerate(file_content.split('\n\n')):
|
|
|
|
print(f"处理文本块: {txt_chunk[:30]}...") # 打印前30个字符以示例
|
|
|
|
|
|
|
|
if txt_chunk.strip(): # 确保不是空行
|
|
|
|
chunk = doc.add_chunk(content=txt_chunk)
|
|
|
|
print(f"第{num+1} Chunk添加成功! ID: {chunk.id}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# content = '''
|
|
|
|
# 第二章 部门职责>第六条 【财务管理部】
|
|
|
|
# (一) 配合投标相关费用的办理工作;
|
|
|
|
# (二) 负责提供投标所需的相关财务资料。'''
|
|
|
|
# chunk = doc.add_chunk(content=content)
|
|
|
|
# print(f"Chunk添加成功! ID: {chunk.id}")
|
2025-07-04 18:26:36 +08:00
|
|
|
#dataset.upload_documents([{"display_name": "1.txt", "blob": open('1.txt',"rb").read()}])
|
|
|
|
|
|
|
|
# 查询所有知识库
|
|
|
|
# for dataset in rag_object.list_datasets():
|
|
|
|
# print(dataset)
|
|
|
|
|
|
|
|
|
|
|
|
# dataset = rag_object.list_datasets(name = "制度")
|
|
|
|
#print(dataset)
|
|
|
|
|
|
|
|
|