Spaces:

huggingface
/

inference-playground

Running

App Files Files Community

mishig HF staff committed on Jul 17, 2024

Commit

7956c78

unverified ·

1 Parent(s): e779e06

Fetch compatible models & their tokenizer files server side (#25)

Browse files

Files changed (4) hide show

src/lib/components/InferencePlayground/InferencePlayground.svelte +12 -20
src/lib/types/index.d.ts +9 -0
src/routes/+page.server.ts +34 -0
src/routes/+page.svelte +2 -1

src/lib/components/InferencePlayground/InferencePlayground.svelte CHANGED Viewed

@@ -9,11 +9,11 @@
 	import PlaygroundTokenModal from './InferencePlaygroundHFTokenModal.svelte';
 	import PlaygroundModelSelector from './InferencePlaygroundModelSelector.svelte';
 	import Conversation from './InferencePlaygroundConversation.svelte';
-	import { onMount } from 'svelte';
-	import { type ModelEntry } from '@huggingface/hub';
 	import { type ChatCompletionInputMessage } from '@huggingface/tasks';
-	let compatibleModels: ModelEntry[] = [];
 	const startMessages: ChatCompletionInputMessage[] = [{ role: 'user', content: '' }];
@@ -40,21 +40,10 @@
 	let abortControllers: AbortController[] = [];
 	let waitForNonStreaming = true;
-	onMount(() => {
-		(async () => {
-			// TODO: use hfjs.hub listModels after https://github.com/huggingface/huggingface.js/pull/795
-			const res = await fetch(
-				'https://huggingface.co/api/models?pipeline_tag=text-generation&inference=Warm&filter=conversational'
-			);
-			compatibleModels = (await res.json()) as ModelEntry[];
-			compatibleModels.sort((a, b) => a.id.toLowerCase().localeCompare(b.id.toLowerCase()));
-		})();
-		return () => {
-			for (const abortController of abortControllers) {
-				abortController.abort();
-			}
-		};
 	});
 	function addMessage() {
@@ -366,7 +355,10 @@
 			<div
 				class="flex flex-1 flex-col gap-6 overflow-y-hidden rounded-xl border border-gray-200/80 bg-gradient-to-b from-white via-white p-3 shadow-sm dark:border-white/5 dark:from-gray-800/40 dark:via-gray-800/40"
 			>
-				<PlaygroundModelSelector {compatibleModels} bind:currentModel={conversations[0].model} />
 				<div
 					class="group relative -mt-4 flex h-[26px] w-full items-center justify-center gap-2 rounded-lg bg-black px-5 text-sm text-white hover:bg-gray-900 focus:outline-none focus:ring-4 focus:ring-gray-300 dark:border-gray-700 dark:bg-blue-600 dark:hover:bg-blue-700 dark:focus:ring-gray-700"
 				>
@@ -400,7 +392,7 @@
 							];
 						}}
 					>
-						{#each compatibleModels as model}
 							<option value={model.id}>{model.id}</option>
 						{/each}
 					</select>

 	import PlaygroundTokenModal from './InferencePlaygroundHFTokenModal.svelte';
 	import PlaygroundModelSelector from './InferencePlaygroundModelSelector.svelte';
 	import Conversation from './InferencePlaygroundConversation.svelte';
+	import { onDestroy } from 'svelte';
 	import { type ChatCompletionInputMessage } from '@huggingface/tasks';
+	import type { ModelEntryWithTokenizer } from '$lib/types';
+	export let models: ModelEntryWithTokenizer[];
 	const startMessages: ChatCompletionInputMessage[] = [{ role: 'user', content: '' }];
 	let abortControllers: AbortController[] = [];
 	let waitForNonStreaming = true;
+	onDestroy(() => { // Svelte teardown hook: abort every AbortController tracked in `abortControllers`.
+		for (const abortController of abortControllers) {
+			abortController.abort();
+		}
 	});
 	function addMessage() {
 			<div
 				class="flex flex-1 flex-col gap-6 overflow-y-hidden rounded-xl border border-gray-200/80 bg-gradient-to-b from-white via-white p-3 shadow-sm dark:border-white/5 dark:from-gray-800/40 dark:via-gray-800/40"
 			>
+				<PlaygroundModelSelector
+					compatibleModels={models}
+					bind:currentModel={conversations[0].model}
+				/>
 				<div
 					class="group relative -mt-4 flex h-[26px] w-full items-center justify-center gap-2 rounded-lg bg-black px-5 text-sm text-white hover:bg-gray-900 focus:outline-none focus:ring-4 focus:ring-gray-300 dark:border-gray-700 dark:bg-blue-600 dark:hover:bg-blue-700 dark:focus:ring-gray-700"
 				>
 							];
 						}}
 					>
+						{#each models as model}
 							<option value={model.id}>{model.id}</option>
 						{/each}
 					</select>

src/lib/types/index.d.ts CHANGED Viewed

@@ -16,3 +16,12 @@ type Conversation = {
 	config: ModelConfig;
 	messages: ChatCompletionInputMessage[];
 };

 	config: ModelConfig;
 	messages: ChatCompletionInputMessage[];
 };
+interface TokenizerConfig { // Shape of `tokenizerConfig`; the server loader fills it from a model's tokenizer_config.json.
+	chat_template?: string; // optional; presumably the model's chat prompt template — confirm against consumers
+	model_max_length?: number; // optional; presumably the tokenizer's declared maximum length — confirm
+}
+export interface ModelEntryWithTokenizer extends ModelEntry { // A ModelEntry plus its tokenizer config. NOTE(review): the `ModelEntry` import is not visible in this hunk — confirm it is in scope.
+	tokenizerConfig: TokenizerConfig; // required: every entry of this type carries a config object
+}

src/routes/+page.server.ts ADDED Viewed

	@@ -0,0 +1,34 @@

+// src/routes/+page.server.ts
+import type { ModelEntryWithTokenizer } from '$lib/types';
+import type { ModelEntry } from '@huggingface/hub';
+import type { PageServerLoad } from './$types';
+/**
+ * Server-side page loader.
+ *
+ * Lists warm, conversational text-generation models from the Hub API, sorts them
+ * case-insensitively by id, and attaches each model's `tokenizer_config.json`.
+ *
+ * @param event - SvelteKit load event; only its `fetch` is used.
+ * @returns `{ models }`, where models whose tokenizer config could not be fetched are omitted.
+ * @throws Error when the model listing request itself does not succeed.
+ */
+export const load: PageServerLoad = async ({ fetch }) => {
+	const apiUrl =
+		'https://huggingface.co/api/models?pipeline_tag=text-generation&inference=Warm&filter=conversational';
+	// NOTE(review): Vite only exposes `VITE_`-prefixed variables on `import.meta.env` by default,
+	// so this may be undefined at runtime — consider SvelteKit's `$env/static/private` instead.
+	const HF_TOKEN: string | undefined = import.meta.env.HF_TOKEN;
+	// Attach credentials only when a token exists, to avoid sending a literal "Bearer undefined".
+	const headers: Record<string, string> = HF_TOKEN ? { Authorization: `Bearer ${HF_TOKEN}` } : {};
+	const res = await fetch(apiUrl, { headers });
+	if (!res.ok) {
+		// Fail loudly here rather than letting an error payload reach `.sort()` below.
+		throw new Error(`Failed to list compatible models: ${res.status} ${res.statusText}`);
+	}
+	let compatibleModels: ModelEntry[] = await res.json();
+	compatibleModels.sort((a, b) => a.id.toLowerCase().localeCompare(b.id.toLowerCase()));
+	// NOTE(review): only the first two models are kept — this looks like a debugging limit; confirm before shipping.
+	compatibleModels = compatibleModels.slice(0, 2);
+	const promises = compatibleModels.map(async (model): Promise<ModelEntryWithTokenizer | null> => {
+		// `id` is the field the sort above and the model <option> list rely on.
+		const configUrl = `https://huggingface.co/${model.id}/raw/main/tokenizer_config.json`;
+		const configRes = await fetch(configUrl, { headers });
+		if (!configRes.ok) {
+			// A missing or inaccessible tokenizer config drops this model instead of failing the whole page.
+			return null;
+		}
+		const tokenizerConfig = await configRes.json();
+		return { ...model, tokenizerConfig } satisfies ModelEntryWithTokenizer;
+	});
+	const models: ModelEntryWithTokenizer[] = (await Promise.all(promises)).filter(
+		(model): model is ModelEntryWithTokenizer => model !== null
+	);
+	return { models };
+};

src/routes/+page.svelte CHANGED Viewed

@@ -1,5 +1,6 @@
 <script lang="ts">
 	import InferencePlayground from '$lib/components/InferencePlayground/InferencePlayground.svelte';
 </script>
-<InferencePlayground />

 <script lang="ts">
+	export let data;
 	import InferencePlayground from '$lib/components/InferencePlayground/InferencePlayground.svelte';
 </script>
+<InferencePlayground models={data.models} />