Improve entity content formatting
This commit is contained in:
2
.gitignore
vendored
2
.gitignore
vendored
@@ -24,3 +24,5 @@ examples/output/
|
||||
.DS_Store
|
||||
# Keep config.ini (and any other *.ini file) out of the repo
|
||||
*.ini
|
||||
build/
|
||||
minirag-venv/
|
||||
|
||||
@@ -10,3 +10,4 @@ tiktoken
|
||||
torch
|
||||
tqdm
|
||||
uvicorn
|
||||
json_repair
|
||||
|
||||
@@ -370,6 +370,16 @@ async def extract_entities(
|
||||
for dp in all_entities_data
|
||||
}
|
||||
await entity_vdb.upsert(data_for_vdb)
|
||||
if entity_vdb is not None:
|
||||
data_for_vdb = {
|
||||
compute_mdhash_id(dp["entity_name"], prefix="ent-"): {
|
||||
"content": dp["entity_name"] + " " + dp["description"],
|
||||
"entity_name": dp["entity_name"],
|
||||
}
|
||||
for dp in all_entities_data
|
||||
}
|
||||
await entity_vdb.upsert(data_for_vdb)
|
||||
|
||||
if entity_name_vdb is not None:
|
||||
data_for_vdb = {
|
||||
compute_mdhash_id(dp["entity_name"], prefix="Ename-"): {
|
||||
@@ -386,12 +396,13 @@ async def extract_entities(
|
||||
"src_id": dp["src_id"],
|
||||
"tgt_id": dp["tgt_id"],
|
||||
"content": dp["keywords"]
|
||||
+ dp["src_id"]
|
||||
+ dp["tgt_id"]
|
||||
+ dp["description"],
|
||||
+ " " + dp["src_id"]
|
||||
+ " " + dp["tgt_id"]
|
||||
+ " " + dp["description"],
|
||||
}
|
||||
for dp in all_relationships_data
|
||||
}
|
||||
|
||||
await relationships_vdb.upsert(data_for_vdb)
|
||||
|
||||
return knowledge_graph_inst
|
||||
|
||||
Reference in New Issue
Block a user