Spaces:

dstars
/

Internlm2.5_RAG

Sleeping

App Files Files Community

Internlm2.5_RAG / llamaindex_RAG.py

dstars

Add Streamlit + LlamaIndex + 浦语 API project

228bb8f 5 months ago

raw

history blame contribute delete

1.86 kB

	import os
	os.environ['NLTK_DATA'] = '/root/nltk_data'

	from llama_index.core import VectorStoreIndex, SimpleDirectoryReader
	from llama_index.core.settings import Settings
	from llama_index.embeddings.huggingface import HuggingFaceEmbedding
	from llama_index.legacy.callbacks import CallbackManager
	from llama_index.llms.openai_like import OpenAILike


	# Create an instance of CallbackManager
	callback_manager = CallbackManager()

	api_base_url = "https://internlm-chat.intern-ai.org.cn/puyu/api/v1/"
	model = "internlm2.5-latest"
	api_key = os.getenv("API_KEY")

	# api_base_url = "https://api.siliconflow.cn/v1"
	# model = "internlm/internlm2_5-7b-chat"
	# api_key = "请填写 API Key"



	llm =OpenAILike(model=model, api_base=api_base_url, api_key=api_key, is_chat_model=True,callback_manager=callback_manager)


	#初始化一个HuggingFaceEmbedding对象，用于将文本转换为向量表示
	embed_model = HuggingFaceEmbedding(
	#指定了一个预训练的sentence-transformer模型的路径
	model_name="/root/model/sentence-transformer"
	)
	#将创建的嵌入模型赋值给全局设置的embed_model属性，
	#这样在后续的索引构建过程中就会使用这个模型。
	Settings.embed_model = embed_model

	#初始化llm
	Settings.llm = llm

	#从指定目录读取所有文档，并加载数据到内存中
	documents = SimpleDirectoryReader("/root/llamaindex_demo/data").load_data()
	#创建一个VectorStoreIndex，并使用之前加载的文档来构建索引。
	# 此索引将文档转换为向量，并存储这些向量以便于快速检索。
	index = VectorStoreIndex.from_documents(documents)
	# 创建一个查询引擎，这个引擎可以接收查询并返回相关文档的响应。
	query_engine = index.as_query_engine()
	response = query_engine.query("Qwen2Attention是什么?")

	print(response)