Spaces:

abugaber
/

aiben

Build error

App Files Files Community

aiben / openai_server /agent_tools /ask_question_about_documents.py

abugaber

Upload folder using huggingface_hub

3943768 verified 6 months ago

raw

history blame

12.6 kB

	import json
	import os
	import argparse
	import re
	import sys
	import time
	import uuid

	if 'src' not in sys.path:
	sys.path.append('src')


	def has_gpu():
	import subprocess
	try:
	result = subprocess.run(['nvidia-smi'], stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
	return result.returncode == 0
	except FileNotFoundError:
	return False


	def get_rag_answer(prompt,
	tag='rag_answer',
	simple=False,
	text_context_list=None, image_files=None, chat_conversation=None,
	model=None,
	system_prompt='auto',
	max_tokens=1024,
	temperature=0,
	stream_output=True,
	guided_json=None,
	response_format='text',
	max_time=120):
	base_url = os.getenv('H2OGPT_OPENAI_BASE_URL')
	assert base_url is not None, "H2OGPT_OPENAI_BASE_URL environment variable is not set"
	server_api_key = os.getenv('H2OGPT_OPENAI_API_KEY', 'EMPTY')

	from openai import OpenAI
	client = OpenAI(base_url=base_url, api_key=server_api_key, timeout=max_time)

	if response_format == 'json_object':
	prompt_summary = prompt
	prompt = None
	else:
	prompt_summary = None

	from openai_server.backend_utils import structure_to_messages
	messages = structure_to_messages(prompt, system_prompt, chat_conversation, image_files)

	extra_body = {}
	if text_context_list:
	extra_body['text_context_list'] = text_context_list
	extra_body['guided_json'] = guided_json
	extra_body['response_format'] = dict(type=response_format)
	if response_format == 'json_object':
	extra_body['langchain_mode'] = "MyData"
	# extra_body['langchain_action'] = "Extract"
	extra_body['langchain_action'] = "Summarize"
	extra_body['prompt_summary'] = prompt_summary
	extra_body['pre_prompt_summary'] = ''
	if simple:
	extra_body['pre_prompt_query'] = ''
	extra_body['prompt_query'] = ''

	responses = client.chat.completions.create(
	messages=messages,
	model=model,
	temperature=temperature,
	max_tokens=max_tokens,
	stream=stream_output,
	extra_body=extra_body,
	)
	text = ''
	tgen0 = time.time()
	verbose = True
	print(f'ENDOFTURN\n')
	if tag:
	print(f'<{tag}>\n')
	if stream_output:
	for chunk in responses:
	delta = chunk.choices[0].delta.content if chunk.choices else None
	if delta:
	text += delta
	print(delta, end='', flush=True)
	if time.time() - tgen0 > max_time:
	if verbose:
	print("\nTook too long for OpenAI or VLLM Chat: %s" % (time.time() - tgen0),
	flush=True)
	break
	else:
	text = responses.choices[0].message.content
	print(text, end='\n', flush=True)
	if tag:
	print(f'\n</{tag}>')
	print(f'\nENDOFTURN\n')
	return text


	def ask_question_about_documents():
	default_max_time = int(os.getenv('H2OGPT_AGENT_OPENAI_TIMEOUT', "120"))
	text_context_list_file = os.getenv('H2OGPT_RAG_TEXT_CONTEXT_LIST')
	chat_conversation_file = os.getenv('H2OGPT_RAG_CHAT_CONVERSATION')
	system_prompt_file = os.getenv('H2OGPT_RAG_SYSTEM_PROMPT')
	b2imgs_file = os.getenv('H2OGPT_RAG_IMAGES')

	if text_context_list_file:
	with open(text_context_list_file, "rt") as f:
	text_context_list = []
	for line in f:
	text_context_list.append(line)
	else:
	text_context_list = []

	if chat_conversation_file:
	with open(chat_conversation_file, "rt") as f:
	chat_conversation = json.loads(f.read())
	else:
	chat_conversation = []
	if system_prompt_file:
	with open(system_prompt_file, "rt") as f:
	system_prompt = f.read()
	else:
	system_prompt = 'auto'
	image_files = []
	if b2imgs_file:
	with open(b2imgs_file, "rt") as f:
	for line in f:
	image_files.append(line)
	else:
	image_files = []

	parser = argparse.ArgumentParser(description="RAG Tool")
	parser.add_argument("--prompt", "--query", type=str, required=True, help="User prompt or query")
	parser.add_argument("--json", action="store_true", default=False, help="Output results as JSON")
	parser.add_argument("--csv", action="store_true", default=False, help="Output results as CSV")
	parser.add_argument("--baseline", required=False, action='store_true',
	help="Whether to get baseline from user docs")
	parser.add_argument("--files", nargs="+", required=False,
	help="Files of documents with optionally additional images to ask question about.")
	parser.add_argument("--urls", nargs="+", required=False,
	help="URLs to ask question about")
	parser.add_argument("-m", "--model", type=str, required=False, help="OpenAI or Open Source model to use")
	parser.add_argument("--timeout", type=float, required=False, default=default_max_time,
	help="Maximum time to wait for response")
	parser.add_argument("--system_prompt", type=str, required=False, default=system_prompt, help="System prompt")
	parser.add_argument("--chat_conversation_file", type=str, required=False,
	help="chat history json list of tuples with each tuple as pair of user then assistant text messages.")
	args = parser.parse_args()

	if not args.model:
	args.model = os.getenv('H2OGPT_AGENT_OPENAI_MODEL')
	if not args.model:
	raise ValueError("Model name must be provided via --model or H2OGPT_AGENT_OPENAI_MODEL environment variable")

	if args.chat_conversation_file:
	with open(args.chat_conversation_file, "rt") as f:
	chat_conversation = json.loads(f.read())

	textual_like_files = {
	".txt": "Text file (UTF-8)",
	".csv": "CSV",
	".toml": "TOML",
	".py": "Python",
	".rst": "reStructuredText",
	".rtf": "Rich Text Format",
	".md": "Markdown",
	#".html": "HTML File",
	#".mhtml": "MHTML File",
	#".htm": "HTML File",
	".xml": "XML",
	".json": "JSON",
	".yaml": "YAML",
	".yml": "YAML",
	".ini": "INI configuration file",
	".log": "Log file",
	".tex": "LaTeX",
	".sql": "SQL file",
	".sh": "Shell script",
	".bat": "Batch file",
	".js": "JavaScript",
	".css": "Cascading Style Sheets",
	".php": "PHP",
	".jsp": "Java Server Pages",
	".pl": "Perl script",
	".r": "R script",
	".lua": "Lua script",
	".conf": "Configuration file",
	".properties": "Java Properties file",
	".tsv": "Tab-Separated Values file",
	".xhtml": "XHTML file",
	".srt": "Subtitle file (SRT)",
	".vtt": "WebVTT file",
	".cpp": "C++ Source file",
	".c": "C Source file",
	".h": "C/C++ Header file",
	".go": "Go Source file",
	}

	files = args.files or []
	urls = args.urls or []
	if files + urls:
	from src.enums import IMAGE_EXTENSIONS
	for filename in files + urls:
	if any(filename.lower().endswith(x.lower()) for x in textual_like_files.keys()):
	with open(filename, "rt") as f:
	text_context_list.append(f.read())
	elif any(filename.endswith(x) for x in IMAGE_EXTENSIONS):
	image_files.append(filename)
	else:
	from openai_server.agent_tools.convert_document_to_text import get_text
	files1 = [filename] if filename in files else []
	urls1 = [filename] if filename in urls else []
	text_context_list = [get_text(files1, urls1)]

	rag_kwargs = dict(text_context_list=text_context_list,
	image_files=image_files,
	chat_conversation=chat_conversation,
	model=args.model,
	system_prompt=args.system_prompt,
	max_time=args.timeout,
	)

	is_small = len(text_context_list) < 4 * 1024

	if args.csv or is_small:
	if not args.prompt:
	prompt_csv = "Extract all information in a well-organized form as a CSV so it can be used for data analysis or plotting. Try to make a single CSV if possible. Ensure each CSV block of output is inside a code block with triple backticks with the csv language tag."
	else:
	prompt_csv = "Extract requested information in a well-organized form as a CSV so it can be used for data analysis or plotting. Try to make a single CSV if possible. Ensure each CSV block of output is inside a code block with triple backticks with the csv language tag.\n\nRequested information: " + args.prompt
	csv_answer = get_rag_answer(prompt_csv, tag='', simple=True, **rag_kwargs)
	matches = re.findall(r'```(?:[a-zA-Z])\n(.?)```', csv_answer, re.DOTALL)
	for match in matches:
	csv_filename = f"output_{str(uuid.uuid4())[:6]}.csv"
	with open(csv_filename, "wt") as f:
	f.write(match)
	print(f"CSV output written to {csv_filename}. You can use this with code generation in order to answer the user's question or obtain some intermediate step using pandas etc. Remember, you are not good at solving puzzles, math, or doing question-answer on tabular data, so use these results in python code in order to solve such tasks.\n")

	if args.json:
	json_kwargs = rag_kwargs.copy()
	json_kwargs['guided_json'] = None
	json_kwargs['response_format'] = 'json_object'
	args.prompt = "Extract information in a well-organized form."
	# so json outputted normally
	json_kwargs['stream_output'] = False
	json_tag = 'json_answer'
	json_answer = get_rag_answer(args.prompt, tag=json_tag, **json_kwargs)
	json_filename = f"output_{str(uuid.uuid4())[:6]}.json"
	with open(json_filename, "wt") as f:
	f.write(json_answer)
	print(f"JSON output written to {json_filename}. You can use this with code generation in order to answer the user's question or obtain some intermediate step.\n")

	if args.baseline:
	tag = 'simple_rag_answer'
	else:
	tag = 'rag_answer'
	if not args.json:
	rag_answer = get_rag_answer(args.prompt, tag=tag, **rag_kwargs)

	if rag_answer and args.baseline:
	print(
	"The above simple_rag_answer answer may be correct, but the answer probably requires validation via checking the documents for similar text or search and news APIs if involves recent events. Note that the LLM answering above has no coding capability or internet access so disregard its concerns about that if it mentions it.")


	if __name__ == "__main__":
	ask_question_about_documents()

	"""
	Examples:

	wget https://aiindex.stanford.edu/wp-content/uploads/2024/04/HAI_2024_AI-Index-Report.pdf
	H2OGPT_AGENT_OPENAI_MODEL=claude-3-5-sonnet-20240620 H2OGPT_OPENAI_BASE_URL=http://0.0.0.0:5000/v1 H2OGPT_OPENAI_API_KEY=EMPTY python /home/jon/h2ogpt/openai_server/agent_tools/ask_question_about_documents.py --prompt "Extract AI-related data for Singapore, Israel, Qatar, UAE, Denmark, and Finland from the HAI_2024_AI-Index-Report.pdf. Focus on metrics related to AI implementation, investment, and innovation. Provide a summary of the data in a format suitable for creating a plot." --files HAI_2024_AI-Index-Report.pdf
	H2OGPT_AGENT_OPENAI_MODEL=claude-3-5-sonnet-20240620 H2OGPT_OPENAI_BASE_URL=http://0.0.0.0:5000/v1 H2OGPT_OPENAI_API_KEY=EMPTY python /home/jon/h2ogpt/openai_server/agent_tools/ask_question_about_documents.py --prompt "Give bullet list of top 10 stories." --urls www.cnn.com
	H2OGPT_AGENT_OPENAI_MODEL=claude-3-5-sonnet-20240620 H2OGPT_OPENAI_BASE_URL=http://0.0.0.0:5000/v1 H2OGPT_OPENAI_API_KEY=EMPTY python /home/jon/h2ogpt/openai_server/agent_tools/ask_question_about_documents.py --prompt "Extract AI-related data for Singapore, Israel, Qatar, UAE, Denmark, and Finland from the HAI_2024_AI-Index-Report.pdf. Focus on metrics related to AI implementation, investment, and innovation. Provide a summary of the data in a format suitable for creating a plot." --urls https://aiindex.stanford.edu/wp-content/uploads/2024/04/HAI_2024_AI-Index-Report.pdf
	"""