# NOTE(review): the three lines below ("Spaces: / Paused / Paused") appear to be
# Hugging Face Spaces UI text captured when this file was copied — not code.
# Commented out so the module remains valid Python; confirm and remove.
# Spaces:
# Paused
# Paused
import logging
import requests
from typing import Optional, Dict, Any
import json
class LLMEngineClient:
    """Thin HTTP client for a remote LLM Engine service.

    Wraps ``requests`` with logging, per-request timeouts, and detection of
    HTML error pages returned in place of JSON (common when a hosted service
    is down or the URL is wrong).
    """

    def __init__(self, base_url: str, timeout: int = 10):
        """
        Args:
            base_url: Root URL of the service; a trailing slash is stripped
                so endpoint paths can be joined safely.
            timeout: Per-request timeout in seconds.
        """
        self.base_url = base_url.rstrip('/')
        self.timeout = timeout
        self.logger = logging.getLogger(__name__)
        # NOTE(review): configuring the root logger from a library class is a
        # side effect kept for backward compatibility; ideally the application,
        # not the client, should call basicConfig().
        logging.basicConfig(
            level=logging.INFO,
            format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
        )
        self.logger.info("Initialized client with base URL: %s", self.base_url)

    def _make_request(self, method: str, endpoint: str, data: Optional[Dict] = None) -> Dict[str, Any]:
        """Make an HTTP request and return the decoded JSON response body.

        Args:
            method: HTTP method name (e.g. ``'GET'``, ``'POST'``).
            endpoint: Path relative to ``base_url``; a leading slash is stripped.
            data: Optional JSON-serializable payload sent as the request body.

        Raises:
            ValueError: if the server answers with an HTML page instead of JSON.
            ConnectionError: if the service is unreachable.
            TimeoutError: if the request exceeds ``self.timeout`` seconds.
            requests.exceptions.RequestException: for other HTTP-level failures
                (including non-2xx statuses via ``raise_for_status``).
        """
        url = f"{self.base_url}/{endpoint.lstrip('/')}"
        self.logger.info("Making %s request to: %s", method, url)
        try:
            # Fix: the original conditional selected 'application/json' in BOTH
            # branches — a dead conditional. Always advertise JSON.
            headers = {
                'Accept': 'application/json',
                'Content-Type': 'application/json',
            }
            response = requests.request(
                method=method,
                url=url,
                json=data if data else None,
                timeout=self.timeout,
                headers=headers,
            )
            # Log response details for debugging (lazy %-formatting so the
            # strings are only built when DEBUG is enabled).
            self.logger.debug("Response status code: %s", response.status_code)
            self.logger.debug("Response headers: %s", response.headers)
            self.logger.debug("Response content: %s", response.text[:500])
            # An HTML body usually means a gateway/error page, not the API.
            content_type = response.headers.get('content-type', '')
            if 'text/html' in content_type:
                self.logger.error("Received HTML response. URL might be incorrect or service might be down.")
                self.logger.error("Attempted URL: %s", url)
                raise ValueError(f"Server returned HTML instead of JSON. Please check if the URL {url} is correct.")
            response.raise_for_status()
            return response.json()
        except requests.exceptions.ConnectionError as e:
            self.logger.error("Failed to connect to %s: %s", url, e)
            # Chain the original exception so the root cause is preserved.
            raise ConnectionError(f"Could not connect to LLM Engine at {url}. Is the service running?") from e
        except requests.exceptions.Timeout as e:
            self.logger.error("Request to %s timed out after %ss", url, self.timeout)
            raise TimeoutError(f"Request timed out after {self.timeout} seconds") from e
        except requests.exceptions.RequestException as e:
            self.logger.error("Request failed: %s", e)
            raise

    def check_health(self) -> Dict[str, Any]:
        """Check if the service is running and get health status."""
        return self._make_request('GET', 'health')

    def initialize_model(self, config: Dict[str, Any]) -> Dict[str, Any]:
        """Initialize the model with given configuration."""
        return self._make_request('POST', 'initialize', data=config)

    def generate_text(self, request: Dict[str, Any]) -> Dict[str, Any]:
        """Generate text using the initialized model."""
        return self._make_request('POST', 'generate', data=request)
def test_connection(base_url: str = "https://teamgenki-llm-engine.hf.space") -> bool:
    """Smoke-test connectivity to the LLM Engine.

    Args:
        base_url: Root URL of the service to probe. Defaults to the hosted
            Space URL (generalized from the previously hard-coded constant,
            so the same check can target a local or staging instance).

    Returns:
        True if both the root and health endpoints respond, False on any
        failure (the error is logged, not raised).
    """
    client = LLMEngineClient(base_url)
    try:
        # Probe each endpoint in turn; any exception fails the whole test.
        client.logger.info("Testing root endpoint...")
        root_response = client._make_request('GET', '')
        client.logger.info("Root endpoint response: %s", root_response)
        client.logger.info("Testing health endpoint...")
        health_status = client.check_health()
        client.logger.info("Health endpoint response: %s", health_status)
        return True
    except Exception as e:
        client.logger.error("Connection test failed: %s", e)
        return False
# Script entry point: run the connection smoke test when executed directly.
if __name__ == "__main__":
    test_connection()