import base64
import tempfile

import requests
import torch

import faster_whisper

device = 'cuda' if torch.cuda.is_available() else 'cpu'

# Load the model from Hugging Face
model_name = 'ivrit-ai/faster-whisper-v2-d4'
model = faster_whisper.WhisperModel(model_name, device=device)

# Maximum data size: 200MB
MAX_PAYLOAD_SIZE = 200 * 1024 * 1024
def download_file(url, max_size_bytes, output_filename, api_key=None):
    """
    Download a file from a given URL with a size limit and an optional API key.

    Args:
        url (str): The URL of the file to download.
        max_size_bytes (int): Maximum allowed file size in bytes.
        output_filename (str): The name of the file to save the download as.
        api_key (str, optional): API key to be used as a bearer token.

    Returns:
        bool: True if the download was successful, False otherwise.
    """
    try:
        headers = {}
        if api_key:
            headers['Authorization'] = f'Bearer {api_key}'

        response = requests.get(url, stream=True, headers=headers)
        response.raise_for_status()

        # Reject early if the server reports a size above the limit.
        file_size = int(response.headers.get('Content-Length', 0))
        if file_size > max_size_bytes:
            print(f"File size ({file_size} bytes) exceeds the maximum allowed size ({max_size_bytes} bytes).")
            return False

        # Stream to disk, enforcing the limit even when Content-Length is missing or wrong.
        downloaded_size = 0
        with open(output_filename, 'wb') as file:
            for chunk in response.iter_content(chunk_size=8192):
                downloaded_size += len(chunk)
                if downloaded_size > max_size_bytes:
                    print(f"Download stopped: size limit exceeded ({max_size_bytes} bytes).")
                    return False
                file.write(chunk)

        print(f"File downloaded successfully: {output_filename}")
        return True

    except requests.RequestException as e:
        print(f"Error downloading file: {e}")
        return False
def transcribe(job):
    datatype = job['input'].get('type', None)
    if not datatype:
        return {"error": "'type' field not provided. Should be 'blob' or 'url'."}

    if datatype not in ['blob', 'url']:
        return {"error": f"'type' should be 'blob' or 'url', but is {datatype} instead."}

    api_key = job['input'].get('api_key', None)

    with tempfile.TemporaryDirectory() as d:
        audio_file = f'{d}/audio.mp3'

        if datatype == 'blob':
            mp3_bytes = base64.b64decode(job['input']['data'])
            with open(audio_file, 'wb') as file:
                file.write(mp3_bytes)
        elif datatype == 'url':
            success = download_file(job['input']['url'], MAX_PAYLOAD_SIZE, audio_file, api_key)
            if not success:
                return {"error": f"Error downloading data from {job['input']['url']}"}

        result = transcribe_core(audio_file)
        return {'result': result}
def transcribe_core(audio_file):
    print('Transcribing...')

    ret = {'segments': []}

    # Transcribe in Hebrew with word-level timestamps; segs is a generator of segments.
    segs, _ = model.transcribe(audio_file, language='he', word_timestamps=True)
    for s in segs:
        words = []
        for w in s.words:
            words.append({
                'start': w.start,
                'end': w.end,
                'word': w.word,
                'probability': w.probability
            })

        seg = {
            'id': s.id,
            'seek': s.seek,
            'start': s.start,
            'end': s.end,
            'text': s.text,
            'avg_logprob': s.avg_logprob,
            'compression_ratio': s.compression_ratio,
            'no_speech_prob': s.no_speech_prob,
            'words': words
        }
        print(seg)
        ret['segments'].append(seg)

    return ret
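
# --- Optional serving sketch -------------------------------------------------
# A minimal, hedged sketch of how this handler could be exposed as a Gradio demo
# (e.g. in a Hugging Face Space). It is not called anywhere by default; it
# assumes the `gradio` package is installed, and the name `launch_gradio_demo`
# is illustrative rather than part of the original handler.
def launch_gradio_demo():
    import gradio as gr

    def _gradio_transcribe(audio_path):
        # With type="filepath", Gradio passes the uploaded audio as a local file path.
        if audio_path is None:
            return {"error": "no audio provided"}
        return transcribe_core(audio_path)

    demo = gr.Interface(
        fn=_gradio_transcribe,
        inputs=gr.Audio(type="filepath", label="Audio"),
        outputs=gr.JSON(label="Transcription"),
        title="ivrit-ai/faster-whisper-v2-d4 transcription",
    )
    demo.launch()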
# The script can be run directly for testing, or wrapped in an HTTP API or a
# Gradio app for serving (see the sketch above).
if __name__ == "__main__":
    # For testing purposes, define a sample job and call the transcribe function
    test_job = {
        "input": {
            "type": "url",
            "url": "https://github.com/metaldaniel/HebrewASR-Comparison/raw/main/HaTankistiot_n12-mp3.mp3",
            "api_key": "your_api_key_here"  # Optional, replace with actual key if needed
        }
    }
    print(transcribe(test_job))
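
    # A 'blob'-type job can be built by base64-encoding a local file. The path
    # 'sample.mp3' below is illustrative only; adjust it before uncommenting.
    #
    # with open('sample.mp3', 'rb') as f:
    #     blob_job = {
    #         "input": {
    #             "type": "blob",
    #             "data": base64.b64encode(f.read()).decode('utf-8')
    #         }
    #     }
    # print(transcribe(blob_job))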