Spaces:

ArthurSrz
/

borges-graph

Runtime error

App Files Files Community

borges-graph / nano-graphrag /examples /using_ollama_as_llm.py

ArthurSrz

feat: Add complete nano-graphrag source code

70ab3b6 6 months ago

raw

history blame contribute delete

3.05 kB

	import os
	import logging
	import ollama
	from nano_graphrag import GraphRAG, QueryParam
	from nano_graphrag import GraphRAG, QueryParam
	from nano_graphrag.base import BaseKVStorage
	from nano_graphrag._utils import compute_args_hash

	# Root logger stays at WARNING; the "nano-graphrag" logger is raised to INFO.
	logging.basicConfig(level=logging.WARNING)
	logging.getLogger("nano-graphrag").setLevel(logging.INFO)

	# WARNING: qwen2-7B may produce unparsable results, which causes graph extraction to fail.
	# Model name passed to the Ollama chat call and recorded alongside cached responses.
	MODEL = "qwen2"


	async def ollama_model_if_cache(
	    prompt, system_prompt=None, history_messages=None, **kwargs
	) -> str:
	    """Ask the Ollama model for a chat completion, reusing a cached reply when possible.

	    Args:
	        prompt: User message appended last to the conversation.
	        system_prompt: Optional system message; when truthy it is placed first.
	        history_messages: Optional earlier messages inserted between the
	            system prompt and the user prompt. They are expected to use the
	            same ``{"role": ..., "content": ...}`` form as the other messages.
	            ``None`` (the default) means no history.
	        **kwargs: Extra options forwarded to the Ollama chat call.
	            ``max_tokens`` and ``response_format`` are dropped first, and
	            ``hashing_kv`` (a cache store, if supplied) is consumed here
	            rather than forwarded.

	    Returns:
	        The text content of the model's reply, either freshly generated or
	        read back from ``hashing_kv``.
	    """
	    # Remove kwargs that are not supported by ollama.
	    kwargs.pop("max_tokens", None)
	    kwargs.pop("response_format", None)
	    # The cache store must not reach the chat call either.
	    hashing_kv: BaseKVStorage = kwargs.pop("hashing_kv", None)

	    messages = []
	    if system_prompt:
	        messages.append({"role": "system", "content": system_prompt})
	    # A None default avoids sharing one mutable list object across calls.
	    messages.extend(history_messages or [])
	    messages.append({"role": "user", "content": prompt})

	    # Return the cached response if there is one.
	    args_hash = None
	    if hashing_kv is not None:
	        args_hash = compute_args_hash(MODEL, messages)
	        cached = await hashing_kv.get_by_id(args_hash)
	        if cached is not None:
	            return cached["return"]

	    # Cache miss (or no cache): only now is a client needed.
	    ollama_client = ollama.AsyncClient()
	    response = await ollama_client.chat(model=MODEL, messages=messages, **kwargs)
	    result = response["message"]["content"]

	    # Store the fresh response so an identical request can skip the model.
	    if hashing_kv is not None:
	        await hashing_kv.upsert({args_hash: {"return": result, "model": MODEL}})
	    return result


	def remove_if_exist(file):
	    """Delete the file at path *file*; do nothing if it is already absent.

	    The removal is attempted directly instead of checking for existence
	    first, so a file that disappears between the check and the delete can
	    no longer cause a ``FileNotFoundError``.

	    Args:
	        file: Path of the file to delete.
	    """
	    try:
	        os.remove(file)
	    except FileNotFoundError:
	        # Already gone, which is exactly the state the caller wants.
	        pass


	# Directory handed to GraphRAG as its working_dir; insert() deletes its old index files from here.
	WORKING_DIR = "./nano_graphrag_cache_ollama_TEST"


	def query():
	    """Run one global-mode question against the index in ``WORKING_DIR`` and print the answer."""
	    engine = GraphRAG(
	        working_dir=WORKING_DIR,
	        best_model_func=ollama_model_if_cache,
	        cheap_model_func=ollama_model_if_cache,
	    )
	    global_param = QueryParam(mode="global")
	    answer = engine.query("What are the top themes in this story?", param=global_param)
	    print(answer)


	def insert():
	    """Rebuild the index from the mock story text and print how long indexing took.

	    Reads ``./tests/mock_data.txt``, deletes five previously generated index
	    files under ``WORKING_DIR`` (only those five are removed), then inserts
	    the text into a new ``GraphRAG`` instance with the LLM cache enabled.
	    """
	    # perf_counter is monotonic, so the measured duration cannot be skewed
	    # by system clock adjustments the way wall-clock time() can.
	    from time import perf_counter

	    with open("./tests/mock_data.txt", encoding="utf-8-sig") as f:
	        fake_text = f.read()

	    # Clear the previous run's index artifacts so indexing starts fresh.
	    for stale_file in (
	        "vdb_entities.json",
	        "kv_store_full_docs.json",
	        "kv_store_text_chunks.json",
	        "kv_store_community_reports.json",
	        "graph_chunk_entity_relation.graphml",
	    ):
	        remove_if_exist(f"{WORKING_DIR}/{stale_file}")

	    rag = GraphRAG(
	        working_dir=WORKING_DIR,
	        enable_llm_cache=True,
	        best_model_func=ollama_model_if_cache,
	        cheap_model_func=ollama_model_if_cache,
	    )
	    start = perf_counter()
	    rag.insert(fake_text)
	    print("indexing time:", perf_counter() - start)


	# Script entry point: build the index first, then run the sample query against it.
	if __name__ == "__main__":
	    insert()
	    query()