Merge pull request #13 from kabachuha/main

Add oobabooga text generation webui api completer Using [my fork](https://github.com/rizerphe/text-generation-webui-with-cors) of the web UI until they add CORS support.
rizerphe · Jun 16, 2023 · a09d86d · a09d86d
2 parents 74273aa + 9afd83b
commit a09d86d
Show file tree

Hide file tree

Showing 5 changed files with 342 additions and 0 deletions.
diff --git a/src/complete/complete.ts b/src/complete/complete.ts
@@ -15,6 +15,14 @@ export interface Model {
 	}>;
 
 	complete: (prompt: Prompt, settings: string) => Promise<string>;
+
+	// The plugin will assure that unload() is called before load()
+	// is called for another model, and that load() is called before
+	// complete() is called for that model. It can, however, call
+	// unload() and load() multiple times for the same model, even
+	// consecutively.
+	load?: () => Promise<void>;
+	unload?: () => Promise<void>;
 }
 
 export interface Completer {

diff --git a/src/complete/completers.ts b/src/complete/completers.ts
@@ -3,10 +3,12 @@ import { OpenAIComplete } from "./completers/openai/openai";
 import { ChatGPTComplete } from "./completers/chatgpt/chatgpt";
 import { JurassicJ2Complete } from "./completers/ai21/ai21";
 import { GooseAIComplete } from "./completers/gooseai/gooseai";
+import { OobaboogaComplete } from "./completers/oobabooga/oobabooga";
 
 export const available: Completer[] = [
 	new ChatGPTComplete(),
 	new OpenAIComplete(),
 	new JurassicJ2Complete(),
 	new GooseAIComplete(),
+	new OobaboogaComplete(),
 ];
diff --git a/src/complete/completers/oobabooga/oobabooga.tsx b/src/complete/completers/oobabooga/oobabooga.tsx
@@ -0,0 +1,266 @@
+import React from "react";
+import { Completer, Model, Prompt } from "../../complete";
+import {
+	SettingsUI as ProviderSettingsUI,
+	Settings,
+	parse_settings,
+} from "./provider_settings";
+import SettingsItem from "../../../components/SettingsItem";
+import { z } from "zod";
+
+export const model_settings_schema = z.object({
+	context_length: z.number().int().nonnegative(),
+	max_new_tokens: z.number().int().nonnegative().optional(),
+	temperature: z.number().nonnegative().optional(),
+	top_p: z.number().nonnegative().optional(),
+	typical_p: z.number().nonnegative().optional(),
+	top_k: z.number().int().nonnegative().optional(),
+	min_length: z.number().int().nonnegative().optional(),
+	penalty_alpha: z.number().nonnegative().optional(),
+	repetition_penalty: z.number().nonnegative().optional(),
+	length_penalty: z.number().nonnegative().optional(),
+	no_repeat_ngram_size: z.number().int().nonnegative().optional(),
+});
+
+const default_model_settings: ModelSettings = {
+	context_length: 4000,
+	max_new_tokens: 120,
+	temperature: 0.3,
+	top_p: 1,
+	typical_p: 1,
+	top_k: 0,
+	min_length: 0,
+	penalty_alpha: 0,
+	repetition_penalty: 1.18,
+	length_penalty: 1,
+	no_repeat_ngram_size: 0,
+};
+const model_settings_fields: {
+	name: string;
+	description: string;
+	field_name: keyof ModelSettings;
+}[] = [
+	{
+		name: "Context length",
+		description: "In characters, how much context should the model get",
+		field_name: "context_length",
+	},
+	{
+		name: "Max new tokens",
+		description: "In tokens, how many tokens should the model generate",
+		field_name: "max_new_tokens",
+	},
+	{
+		name: "Temperature",
+		description: "How creative should the model be",
+		field_name: "temperature",
+	},
+	{
+		name: "Top p",
+		description: "What percentage of tokens should be considered",
+		field_name: "top_p",
+	},
+	{
+		name: "Typical p",
+		description: "Cumulative probability of considered tokens",
+		field_name: "typical_p",
+	},
+	{
+		name: "Top k",
+		description: "How many tokens should be considered (0 = all)",
+		field_name: "top_k",
+	},
+	{
+		name: "Min length",
+		description: "Minimum length of generated text (in tokens)",
+		field_name: "min_length",
+	},
+	{
+		name: "Penalty alpha",
+		description: "Penalty alpha",
+		field_name: "penalty_alpha",
+	},
+	{
+		name: "Repetition penalty",
+		description: "How much should the model avoid repeating itself",
+		field_name: "repetition_penalty",
+	},
+	{
+		name: "Length penalty",
+		description: "How much should the model avoid short outputs",
+		field_name: "length_penalty",
+	},
+	{
+		name: "No repeat ngram size",
+		description: "How long are the sequences that should be kept unique",
+		field_name: "no_repeat_ngram_size",
+	},
+];
+
+export type ModelSettings = z.infer<typeof model_settings_schema>;
+const parse_model_settings = (settings: string): ModelSettings => {
+	try {
+		return model_settings_schema.parse(JSON.parse(settings));
+	} catch (e) {
+		return { context_length: 4000 };
+	}
+};
+
+const model_list_response_schema = z.object({
+	result: z.array(z.string()),
+});
+
+const model_response_schema = z.object({
+	result: z.optional(z.string()),
+});
+
+export default class OobaboogaModel implements Model {
+	id: string;
+	name: string;
+	description: string;
+
+	provider_settings: Settings;
+	Settings = ({
+		settings,
+		saveSettings,
+	}: {
+		settings: string | null;
+		saveSettings: (settings: string) => void;
+	}) => {
+		const parsed_settings = parse_model_settings(settings || "");
+		return (
+			<>
+				{model_settings_fields.map((property) => (
+					<SettingsItem
+						name={property.name}
+						description={property.description}
+					>
+						<input
+							type="number"
+							value={parsed_settings[property.field_name]}
+							placeholder={default_model_settings[
+								property.field_name
+							]?.toString()}
+							onChange={(e) =>
+								saveSettings(
+									JSON.stringify({
+										...parsed_settings,
+										[property.field_name]: parseFloat(
+											e.target.value
+										),
+									})
+								)
+							}
+						/>
+					</SettingsItem>
+				))}
+			</>
+		);
+	};
+
+	constructor(id: string, provider_settings: string) {
+		this.id = id;
+		this.name = id;
+		this.description = `Oobabooga ${id} model`;
+		this.provider_settings = parse_settings(provider_settings);
+	}
+
+	async set_model(): Promise<void> {
+		await fetch(`${this.provider_settings.host_url}/api/v1/model`, {
+			method: "POST",
+			headers: {
+				"Content-Type": "application/json",
+			},
+			body: JSON.stringify({
+				action: "load",
+				model_name: this.id,
+			}),
+		}).then((res) => res.json());
+	}
+
+	async get_current_model(): Promise<string | undefined> {
+		const currently_enabled_model = await fetch(
+			`${this.provider_settings.host_url}/api/v1/model`,
+			{
+				method: "GET",
+				headers: {
+					"Content-Type": "application/json",
+					"Cache-Control": "no-cache",
+				},
+			}
+		).then((res) => res.json());
+
+		return model_response_schema.parse(currently_enabled_model).result;
+	}
+
+	async load(): Promise<void> {
+		const currently_enabled_model = await this.get_current_model();
+		if (currently_enabled_model !== this.id) {
+			await this.set_model();
+		}
+	}
+
+	async create_completion(request: any): Promise<any> {
+		try {
+			const response = await fetch(
+				`${this.provider_settings.host_url}/api/v1/generate`,
+				{
+					method: "POST",
+					headers: {
+						"Content-Type": "application/json",
+					},
+					body: JSON.stringify(request),
+				}
+			).then((res) => res.json());
+
+			return response;
+		} catch (error) {
+			throw new Error(`Request failed: ${error.message}`);
+		}
+	}
+
+	async complete(prompt: Prompt, settings: string): Promise<string> {
+		const parsed_settings = parse_model_settings(settings);
+		const { context_length, ...model_params } = parsed_settings;
+
+		const response = await this.create_completion({
+			...model_params,
+			prompt: prompt.prefix.slice(-context_length),
+			do_sample: true,
+			num_beams: 1,
+			early_stopping: false,
+			seed: -1,
+			add_bos_token: true,
+			ban_eos_token: false,
+			skip_special_tokens: true,
+			stopping_strings: [],
+		});
+
+		return response.results[0].text || "";
+	}
+}
+
+export class OobaboogaComplete implements Completer {
+	id: string = "oobabooga";
+	name: string = "Oobabooga";
+	description: string = "Oobabooga text generation webui";
+
+	async get_models(settings: string) {
+		const models = await fetch(
+			`${parse_settings(settings).host_url}/api/v1/model`,
+			{
+				method: "POST",
+				headers: {
+					"Content-Type": "application/json",
+				},
+				body: JSON.stringify({ action: "list" }),
+			}
+		).then((res) => res.json());
+
+		return model_list_response_schema
+			.parse(models)
+			.result.map((model) => new OobaboogaModel(model, settings));
+	}
+
+	Settings = ProviderSettingsUI;
+}
diff --git a/src/complete/completers/oobabooga/provider_settings.tsx b/src/complete/completers/oobabooga/provider_settings.tsx
@@ -0,0 +1,59 @@
+import * as React from "react";
+import SettingsItem from "../../../components/SettingsItem";
+
+export interface Settings {
+	host_url: string;
+}
+
+const default_settings: Settings = {
+	host_url: "http://localhost:5000",
+};
+
+export const parse_settings = (data: string | null): Settings => {
+	if (data === null) {
+		return default_settings;
+	}
+	try {
+		const settings = JSON.parse(data);
+		if (typeof settings.host_url !== "string") {
+			return default_settings;
+		}
+		return settings;
+	} catch (e) {
+		return default_settings;
+	}
+};
+
+export function SettingsUI({
+	settings,
+	saveSettings,
+}: {
+	settings: string | null;
+	saveSettings: (settings: string) => void;
+}) {
+	return (
+		<SettingsItem
+			name="API URL"
+			description={
+				<>
+					Your{" "}
+					<a href="https://github.com/rizerphe/text-generation-webui-with-cors">
+						oobabooga
+					</a>{" "}
+					api host URL - note that (at least for now) this does not
+					use the original webui, but a modified version that allows
+					CORS requests. Make sure you're running it in text
+					completion (not chat) mode, too.
+				</>
+			}
+		>
+			<input
+				type="text"
+				value={parse_settings(settings).host_url}
+				onChange={(e) =>
+					saveSettings(JSON.stringify({ host_url: e.target.value }))
+				}
+			/>
+		</SettingsItem>
+	);
+}
diff --git a/src/main.tsx b/src/main.tsx
@@ -334,6 +334,12 @@ export default class Companion extends Plugin {
 		return cached;
 	}
 
+	async load_model(model: CompletionCacher) {
+		if (this.last_used_model?.model.id === model.model.id) return;
+		await this.last_used_model?.model?.unload?.();
+		await model?.model?.load?.();
+	}
+
 	async _complete(
 		prefix: string,
 		suffix: string,
@@ -342,6 +348,7 @@ export default class Companion extends Plugin {
 	) {
 		const cacher = await this.get_model(provider, model);
 		if (!cacher) return null;
+		await this.load_model(cacher);
 		const completion = await cacher.complete({
 			prefix: prefix,
 			suffix: suffix,