LLM-Inference

Sleeping

App Files Files Community

mishig HF Staff committed on Jul 17, 2024

Commit

dd66861

unverified ·

1 Parent(s): 35f4e45

Check if model support system prompt (#26)

Browse files

Files changed (2) hide show

src/lib/components/InferencePlayground/InferencePlayground.svelte +15 -6
src/lib/components/InferencePlayground/inferencePlaygroundUtils.ts +5 -7

src/lib/components/InferencePlayground/InferencePlayground.svelte CHANGED Viewed

@@ -1,9 +1,9 @@
 <script lang="ts">
 	import {
 		createHfInference,
-		prepareRequestMessages,
 		handleStreamingResponse,
-		handleNonStreamingResponse
 	} from './inferencePlaygroundUtils';
 	import PlaygroundOptions from './InferencePlaygroundGenerationConfig.svelte';
 	import PlaygroundTokenModal from './InferencePlaygroundHFTokenModal.svelte';
@@ -20,7 +20,7 @@
 	let conversations: Conversation[] = [
 		{
 			id: String(Math.random()),
-			model: '01-ai/Yi-1.5-34B-Chat',
 			config: { temperature: 0.5, maxTokens: 2048, streaming: true },
 			messages: startMessages
 		}
@@ -40,6 +40,8 @@
 	let abortControllers: AbortController[] = [];
 	let waitForNonStreaming = true;
 	onDestroy(() => {
 		for (const abortController of abortControllers) {
 			abortController.abort();
@@ -114,7 +116,10 @@
 	async function runInference(conversation: Conversation) {
 		const startTime = performance.now();
 		const hf = createHfInference(hfToken);
-		const requestMessages = prepareRequestMessages(systemMessage, conversation.messages);
 		if (conversation.config.streaming) {
 			const streamingMessage = { role: 'assistant', content: '' };
@@ -216,12 +221,16 @@
 	<div class=" flex flex-col overflow-y-auto py-3 pr-3">
 		<div
 			class="relative flex flex-1 flex-col gap-6 overflow-y-hidden rounded-r-xl border-x border-y border-gray-200/80 bg-gradient-to-b from-white via-white p-3 shadow-sm dark:border-white/5 dark:from-gray-800/40 dark:via-gray-800/40"
 		>
-			<div class="pb-2 text-sm font-semibold">SYSTEM</div>
 			<textarea
 				name=""
 				id=""
-				placeholder="Enter a custom prompt"
 				bind:value={systemMessage.content}
 				class="absolute inset-x-0 bottom-0 h-full resize-none bg-transparent px-3 pt-10 text-sm outline-none"
 			></textarea>

 <script lang="ts">
 	import {
 		createHfInference,
 		handleStreamingResponse,
+		handleNonStreamingResponse,
+		isSystemPromptSupported
 	} from './inferencePlaygroundUtils';
 	import PlaygroundOptions from './InferencePlaygroundGenerationConfig.svelte';
 	import PlaygroundTokenModal from './InferencePlaygroundHFTokenModal.svelte';
 	let conversations: Conversation[] = [
 		{
 			id: String(Math.random()),
+			model: models[0],
 			config: { temperature: 0.5, maxTokens: 2048, streaming: true },
 			messages: startMessages
 		}
 	let abortControllers: AbortController[] = [];
 	let waitForNonStreaming = true;
+	$: systemPromptSupported = isSystemPromptSupported(conversations[0].model);
 	onDestroy(() => {
 		for (const abortController of abortControllers) {
 			abortController.abort();
 	async function runInference(conversation: Conversation) {
 		const startTime = performance.now();
 		const hf = createHfInference(hfToken);
+		const requestMessages = [
+			...(systemPromptSupported && systemMessage?.content?.length ? [systemMessage] : []),
+			...conversation.messages
+		];
 		if (conversation.config.streaming) {
 			const streamingMessage = { role: 'assistant', content: '' };
 	<div class=" flex flex-col overflow-y-auto py-3 pr-3">
 		<div
 			class="relative flex flex-1 flex-col gap-6 overflow-y-hidden rounded-r-xl border-x border-y border-gray-200/80 bg-gradient-to-b from-white via-white p-3 shadow-sm dark:border-white/5 dark:from-gray-800/40 dark:via-gray-800/40"
+			class:pointer-events-none={!systemPromptSupported}
+			class:opacity-70={!systemPromptSupported}
 		>
+			<div class="pb-2 text-sm font-semibold uppercase">system</div>
 			<textarea
 				name=""
 				id=""
+				placeholder={systemPromptSupported
+					? 'Enter a custom prompt'
+					: 'System prompt is not supported with the chosen model.'}
 				bind:value={systemMessage.content}
 				class="absolute inset-x-0 bottom-0 h-full resize-none bg-transparent px-3 pt-10 text-sm outline-none"
 			></textarea>

src/lib/components/InferencePlayground/inferencePlaygroundUtils.ts CHANGED Viewed

@@ -1,17 +1,11 @@
 import { type ChatCompletionInputMessage } from '@huggingface/tasks';
 import { HfInference } from '@huggingface/inference';
 /**
  * Builds an `HfInference` client from the given access token.
  *
  * @param token - Token passed straight to the `HfInference` constructor.
  * @returns A newly constructed `HfInference` instance.
  */
 export function createHfInference(token: string): HfInference {
 	const client = new HfInference(token);
 	return client;
 }
-/**
- * Assembles the message list sent with a request.
- *
- * The system message is placed first, but only when its content is
- * non-empty; the conversation messages follow in their original order.
- * A new array is returned in both cases.
- *
- * @param systemMessage - Candidate system message; skipped when its content is empty.
- * @param messages - Conversation messages to include after the system message.
- * @returns A fresh array of messages for the request.
- */
-export function prepareRequestMessages(
-	systemMessage: ChatCompletionInputMessage,
-	messages: ChatCompletionInputMessage[]
-): ChatCompletionInputMessage[] {
-	if (systemMessage.content.length) {
-		return [systemMessage, ...messages];
-	}
-	return [...messages];
-}
 export async function handleStreamingResponse(
 	hf: HfInference,
 	model: string,
@@ -65,3 +59,7 @@ export async function handleNonStreamingResponse(
 	}
 	throw new Error('No response from the model');
 }

 import { type ChatCompletionInputMessage } from '@huggingface/tasks';
 import { HfInference } from '@huggingface/inference';
+import type { ModelEntryWithTokenizer } from '$lib/types';
 /**
  * Builds an `HfInference` client from the given access token.
  *
  * @param token - Token passed straight to the `HfInference` constructor.
  * @returns A newly constructed `HfInference` instance.
  */
 export function createHfInference(token: string): HfInference {
 	const client = new HfInference(token);
 	return client;
 }
 export async function handleStreamingResponse(
 	hf: HfInference,
 	model: string,
 	}
 	throw new Error('No response from the model');
 }
+/**
+ * Reports whether the model's chat template appears to handle a system prompt.
+ *
+ * This is a substring heuristic: the result is `true` exactly when
+ * `tokenizerConfig.chat_template` is present and its `includes('system')`
+ * check succeeds.
+ *
+ * @param model - Model entry whose `tokenizerConfig.chat_template` is inspected.
+ * @returns `true` if the template mentions `system`; `false` otherwise,
+ *   including when no chat template is defined.
+ */
+export function isSystemPromptSupported(model: ModelEntryWithTokenizer): boolean {
+	// Without `?? false` the optional chain would leak `undefined` to callers
+	// whenever the model has no chat template.
+	return model.tokenizerConfig.chat_template?.includes('system') ?? false;
+}