2023-07-04 14:05:27 +00:00
< html >
< head >
< meta charset = "UTF-8" >
<!-- No maximum-scale here: capping the zoom level prevents users from pinch-zooming the page. -->
<meta name="viewport" content="width=device-width, initial-scale=1">
2023-08-01 08:56:23 +00:00
< meta name = "color-scheme" content = "light dark" >
2023-07-04 14:05:27 +00:00
< title > llama.cpp - chat< / title >
< style >
/* Base typography: the platform UI font at 90% of the default size. */
body {
font-family: system-ui;
font-size: 90%;
}
2024-06-01 19:31:48 +00:00
/* Grid with three auto-sized columns and 10px of inner padding. */
.grid-container {
display: grid;
grid-template-columns: auto auto auto;
padding: 10px;
}
/* Padded, center-aligned cell; presumably used for the children of .grid-container. */
.grid-item {
padding: 5px;
/* font-size: 30px; */
text-align: center;
}
2023-07-04 14:05:27 +00:00
/* Full-height vertical flex column; free space is distributed between its children. */
#container {
margin: 0em auto;
display: flex;
flex-direction: column;
justify-content: space-between;
height: 100%;
}
/*
 * Bordered, rounded column that grows to take the remaining height
 * (flex-grow) and scrolls vertically when its content overflows.
 */
main {
margin: 3px;
display: flex;
flex-direction: column;
justify-content: space-between;
gap: 1em;
flex-grow: 1;
overflow-y: auto;
border: 1px solid #ccc;
border-radius: 5px;
padding: 0.5em;
}
2024-06-01 19:31:48 +00:00
h1 {
text-align: center;
}
/*
 * Button-like link. The layout and typography are shared by every link state
 * so the element keeps the same shape whether it is unvisited, visited,
 * hovered or pressed. Previously only :link declared the rounded corners, so
 * a visited link lost them.
 */
.customlink:link,
.customlink:visited,
.customlink:hover,
.customlink:active {
  color: white;
  background-color: #007aff;
  font-weight: 600;
  text-decoration: none;
  float: right;
  margin-top: 30px;
  display: flex;
  flex-direction: row;
  gap: 0.5em;
  justify-content: flex-end;
  border-radius: 4px;
  padding: 8px;
}
/* Hover: slightly darker background. Declared after the shared rule so it wins at equal specificity. */
.customlink:hover {
  background-color: #0070ee;
}
/* Pressed: light background with blue text. Declared last so it overrides :hover. */
.customlink:active {
  color: #0070ee;
  background-color: #80b3ef;
}
2023-07-04 14:05:27 +00:00
/* Page column: between 300px and 600px wide, centered horizontally. */
body {
max-width: 600px;
min-width: 300px;
line-height: 1.2;
margin: 0 auto;
padding: 0 0.5em;
}
/* Paragraphs: long words may break or hyphenate instead of overflowing. */
p {
overflow-wrap: break-word;
word-wrap: break-word;
hyphens: auto;
margin-top: 0.5em;
margin-bottom: 0.5em;
}
/* Form inside #write: vertical stack whose children stretch to full width. */
#write form {
margin: 1em 0 0 0;
display: flex;
flex-direction: column;
gap: 0.5em;
align-items: stretch;
}
2024-07-25 22:10:16 +00:00
.message-controls {
2023-07-04 14:05:27 +00:00
display: flex;
justify-content: flex-end;
}
2024-07-25 22:10:16 +00:00
/* Second child of .message-controls: vertical stack of control rows. */
.message-controls > div:nth-child(2) {
display: flex;
flex-direction: column;
gap: 0.5em;
}
/* Each control row: horizontal flex line pushed to the right edge by margin-left: auto. */
.message-controls > div:nth-child(2) > div {
display: flex;
margin-left: auto;
gap: 0.5em;
}
2023-07-04 14:05:27 +00:00
/* Reset: remove the border, padding and margin from fieldsets. */
fieldset {
border: none;
padding: 0;
margin: 0;
}
2023-07-24 14:54:22 +00:00
/* Grid fieldset whose template string declares two column tracks. */
fieldset.two {
display: grid;
grid-template: "a a";
gap: 1em;
}
/* Grid fieldset whose template string declares three column tracks. */
fieldset.three {
display: grid;
grid-template: "a a a";
gap: 1em;
}
/* Collapsible section: bordered box with no bottom padding while closed. */
details {
border: 1px solid #aaa;
border-radius: 4px;
padding: 0.5em 0.5em 0;
margin-top: 0.5em;
}
/*
 * The negative margins cancel the padding of the enclosing details box and
 * the summary's own padding restores the inset, so the clickable area spans
 * the whole width of the box.
 */
summary {
font-weight: bold;
margin: -0.5em -0.5em 0;
padding: 0.5em;
cursor: pointer;
}
/* When open, the box gets padding on all four sides. */
details[open] {
padding: 0.5em;
}
2023-08-25 10:32:45 +00:00
/* Padded entry with a bottom separator line. */
.prob-set {
padding: 0.3em;
border-bottom: 1px solid #ccc;
}
/* Absolutely positioned white panel with a soft drop shadow. */
.popover-content {
position: absolute;
background-color: white;
padding: 0.2em;
box-shadow: 0 0 10px rgba(0, 0, 0, 0.1);
}
2023-07-24 14:54:22 +00:00
2023-07-04 14:05:27 +00:00
/* Text areas take the full width and grow inside flex containers. */
textarea {
padding: 5px;
flex-grow: 1;
width: 100%;
}
/* Code inside pre: block-level, light text on a dark background. */
pre code {
display: block;
background-color: #222;
color: #ddd;
}
2023-10-22 19:53:08 +00:00
2023-07-04 14:05:27 +00:00
/* Code: monospace with a small padded, rounded box. */
code {
font-family: monospace;
padding: 0.1em 0.3em;
border-radius: 3px;
}
/* Labels inside a fieldset: one per line with vertical spacing. */
fieldset label {
margin: 0.5em 0;
display: block;
}
2023-07-05 20:51:13 +00:00
2023-10-12 06:51:53 +00:00
/* Compact label variant: inline with horizontal spacing only (overrides the block layout of "fieldset label"). */
fieldset label.slim {
margin: 0 0.5em;
display: inline;
}
2023-10-22 19:53:08 +00:00
header,
footer {
2023-07-05 20:51:13 +00:00
text-align: center;
}
/* Footer text: smaller and grey. */
footer {
font-size: 80%;
color: #888;
}
2023-08-25 10:32:45 +00:00
2023-10-12 06:51:53 +00:00
/* Prompt textarea height under .mode-chat. */
.mode-chat textarea[name=prompt] {
height: 4.5em;
}
/* Prompt textarea height under .mode-completion (taller than under .mode-chat). */
.mode-completion textarea[name=prompt] {
height: 10em;
}
2023-11-10 22:49:33 +00:00
/*
 * Editable regions: inline-block, whitespace and line breaks preserved.
 * NOTE(review): the zero-width transparent outline removes the visible focus
 * ring; no replacement focus style is visible in this part of the file.
 */
[contenteditable] {
display: inline-block;
white-space: pre-wrap;
outline: 0px solid transparent;
}
2023-09-04 08:28:55 +00:00
@keyframes loading-bg-wipe {
0% {
background-position: 0%;
}
2023-10-22 19:53:08 +00:00
2023-09-04 08:28:55 +00:00
100% {
background-position: 100%;
}
}
/*
 * Busy indicator: a horizontal gradient (transparent -> solid -> transparent)
 * built from the two custom properties, half as wide as the element, animated
 * by the loading-bg-wipe keyframes on a 2s linear infinite loop.
 */
.loading {
--loading-color-1: #eeeeee00;
--loading-color-2: #eeeeeeff;
background-size: 50% 100%;
background-image: linear-gradient(90deg, var(--loading-color-1), var(--loading-color-2), var(--loading-color-1));
animation: loading-bg-wipe 2s linear infinite;
}
2023-08-25 10:32:45 +00:00
@media (prefers-color-scheme: dark) {
2023-09-04 08:28:55 +00:00
.loading {
--loading-color-1: #22222200;
--loading-color-2: #222222ff;
}
2023-10-22 19:53:08 +00:00
2023-08-25 10:32:45 +00:00
.popover-content {
background-color: black;
}
}
2023-07-04 14:05:27 +00:00
< / style >
< script type = "module" >
import {
2023-08-25 10:32:45 +00:00
html, h, signal, effect, computed, render, useSignal, useEffect, useRef, Component
2024-03-27 05:55:29 +00:00
} from './index.js';
2023-07-04 14:05:27 +00:00
2024-03-27 05:55:29 +00:00
import { llama } from './completion.js';
import { SchemaConverter } from './json-schema-to-grammar.mjs';
2024-07-25 22:10:16 +00:00
2023-10-22 19:53:08 +00:00
let selected_image = false;
var slot_id = -1;
2023-07-04 14:05:27 +00:00
const session = signal({
2023-08-18 21:45:36 +00:00
prompt: "This is a conversation between User and Llama, a friendly chatbot. Llama is helpful, kind, honest, good at writing, and never fails to answer any requests immediately and with precision.",
2023-07-04 14:05:27 +00:00
template: "{{prompt}}\n\n{{history}}\n{{char}}:",
historyTemplate: "{{name}}: {{message}}",
transcript: [],
2023-10-12 06:51:53 +00:00
type: "chat", // "chat" | "completion"
2023-08-18 21:45:36 +00:00
char: "Llama",
2023-07-04 14:05:27 +00:00
user: "User",
2023-10-22 19:53:08 +00:00
image_selected: ''
2023-07-04 14:05:27 +00:00
})
const params = signal({
n_predict: 400,
temperature: 0.7,
2023-07-24 14:54:22 +00:00
repeat_last_n: 256, // 0 = disable penalty, -1 = context size
repeat_penalty: 1.18, // 1.0 = disabled
2024-04-04 15:03:00 +00:00
penalize_nl: false,
2024-10-25 16:07:34 +00:00
dry_multiplier: 0.0, // 0.0 = disabled, 0.8 works well
dry_base: 1.75, // 0.0 = disabled
dry_allowed_length: 2, // tokens extending repetitions beyond this receive penalty, 2 works well
dry_penalty_last_n: -1, // how many tokens to scan for repetitions (0 = disable penalty, -1 = context size)
2023-07-24 14:54:22 +00:00
top_k: 40, // < = 0 to use vocab size
2023-12-12 10:12:35 +00:00
top_p: 0.95, // 1.0 = disabled
2023-11-09 02:00:34 +00:00
min_p: 0.05, // 0 = disabled
2024-10-15 10:54:55 +00:00
xtc_probability: 0.0, // 0 = disabled;
xtc_threshold: 0.1, // > 0.5 disables XTC;
2023-07-24 14:54:22 +00:00
typical_p: 1.0, // 1.0 = disabled
presence_penalty: 0.0, // 0.0 = disabled
frequency_penalty: 0.0, // 0.0 = disabled
mirostat: 0, // 0/1/2
mirostat_tau: 5, // target entropy
mirostat_eta: 0.1, // learning rate
2023-08-14 08:20:17 +00:00
grammar: '',
2023-10-22 19:53:08 +00:00
n_probs: 0, // no completion_probabilities,
2024-02-18 19:11:16 +00:00
min_keep: 0, // min probs from each sampler,
2023-10-22 19:53:08 +00:00
image_data: [],
2023-12-15 11:49:01 +00:00
cache_prompt: true,
api_key: ''
2023-07-04 14:05:27 +00:00
})
2023-12-12 09:53:36 +00:00
/* START: Support for storing prompt templates and parameters in browsers LocalStorage */
2023-08-17 23:34:01 +00:00
const local_storage_storageKey = "llamacpp_server_local_storage";
// Serialize `content` to JSON and store it in localStorage under the
// namespaced key "<local_storage_storageKey>/<tag>".
function local_storage_setDataFromObject(tag, content) {
  const storageSlot = `${local_storage_storageKey}/${tag}`;
  const serialized = JSON.stringify(content);
  localStorage.setItem(storageSlot, serialized);
}
// Store `content` as-is (no JSON encoding) in localStorage under the
// namespaced key "<local_storage_storageKey>/<tag>".
function local_storage_setDataFromRawText(tag, content) {
  const storageSlot = `${local_storage_storageKey}/${tag}`;
  localStorage.setItem(storageSlot, content);
}
// Read the entry stored under "<local_storage_storageKey>/<tag>" and return
// it parsed from JSON.
//
// Returns null when the entry is missing or empty. It also returns null (with
// a console warning) when the stored text is not valid JSON: this function is
// called while the module loads, so letting the parse error escape would stop
// the whole page from starting because of one corrupted entry.
function local_storage_getDataAsObject(tag) {
  const item = localStorage.getItem(local_storage_storageKey + '/' + tag);
  if (!item) {
    return null;
  }
  try {
    return JSON.parse(item);
  } catch (err) {
    console.warn('Ignoring unreadable LocalStorage entry "' + tag + '"', err);
    return null;
  }
}
// Return the raw text stored under "<local_storage_storageKey>/<tag>", or
// null when the entry is missing or is the empty string.
function local_storage_getDataAsRawText(tag) {
  const storedText = localStorage.getItem(`${local_storage_storageKey}/${tag}`);
  return storedText ? storedText : null;
}
// create a container for user templates and settings
const savedUserTemplates = signal({})
const selectedUserTemplate = signal({ name: '', template: { session: {}, params: {} } })
// let's import locally saved templates and settings if there are any
// user templates and settings are stored in one object
// in form of { "templatename": "templatedata" } and { "settingstemplatename":"settingsdata" }
// Load the user's saved templates from LocalStorage. In both cases the
// built-in defaults are (re)written as the "default" template and the
// resulting collection is stored back.
console.log('Importing saved templates')
let importedTemplates = local_storage_getDataAsObject('user_templates')
if (!importedTemplates) {
  // no saved templates detected.
  console.log('Initializing LocalStorage and saving default template')
  savedUserTemplates.value = { "default": { session: session.value, params: params.value } }
} else {
  // saved templates were successfully imported.
  console.log('Processing saved templates and updating default template')
  // make sure no image payload ends up in the stored default template
  params.value = { ...params.value, image_data: [] };
  savedUserTemplates.value = importedTemplates;
  // override default template
  savedUserTemplates.value.default = { session: session.value, params: params.value }
}
local_storage_setDataFromObject('user_templates', savedUserTemplates.value)
// Point the selected-template signal at the saved "default" template.
//
// A new object is assigned to the signal instead of mutating the current one
// in place: an in-place mutation does not notify the signal's subscribers,
// and it also modifies whatever object had previously been stored there.
function userTemplateResetToDefault() {
  console.log('Resetting template to default')
  selectedUserTemplate.value = {
    name: 'default',
    data: savedUserTemplates.value['default'],
  };
}
// Make template `t` the live configuration: copy `t.data.session` into the
// session signal and `t.data.params` into the params signal, clearing any
// image state (`image_selected`, `image_data`) carried by the template.
//
// Each signal is written exactly once, so subscribers never observe an
// intermediate value that still contains the template's image fields.
function userTemplateApply(t) {
  session.value = { ...t.data.session, image_selected: '' };
  params.value = { ...t.data.params, image_data: [] };
}
// Select the "default" template, then apply it to the live session/params.
function userTemplateResetToDefaultAndApply() {
  userTemplateResetToDefault();
  const defaultTemplate = selectedUserTemplate.value;
  userTemplateApply(defaultTemplate);
}
// Restore the template autosaved under 'user_templates_last' if there is one,
// otherwise fall back to the default template; then apply whichever template
// ended up selected.
function userTemplateLoadAndApplyAutosaved() {
  const autosaved = local_storage_getDataAsObject('user_templates_last');
  if (!autosaved) {
    console.log('No autosaved template found, using default template')
    // nothing was autosaved yet, so start from the default template
    userTemplateResetToDefault()
  } else {
    console.log('Autosaved template found, restoring')
    selectedUserTemplate.value = autosaved
  }
  // push the selected template into the live session/params
  console.log('Applying template')
  userTemplateApply(selectedUserTemplate.value)
}
//console.log(savedUserTemplates.value)
//console.log(selectedUserTemplate.value)
// Write the current session and params into the autosave slot
// ('user_templates_last').
//
// The 'default' template is never saved under its own name: when it is the
// selected one, the snapshot is stored under a new timestamped
// "UserTemplate-<ms>" name and then loaded back so it becomes the selected
// template.
function userTemplateAutosave() {
  console.log('Template Autosave...')
  const snapshot = { 'session': session.value, 'params': params.value };
  const activeName = selectedUserTemplate.value.name;
  if (activeName != 'default') {
    local_storage_setDataFromObject('user_templates_last', { 'name': activeName, 'data': snapshot });
    return;
  }
  // we don't want to save over the default template, so create a new one
  const newTemplateName = 'UserTemplate-' + Date.now().toString();
  console.log('Saving as ' + newTemplateName)
  // save in the autosave slot
  local_storage_setDataFromObject('user_templates_last', { 'name': newTemplateName, 'data': snapshot });
  // and load it back and apply
  userTemplateLoadAndApplyAutosaved()
}
console.log('Checking for autosaved last used template')
userTemplateLoadAndApplyAutosaved()
/* END: Support for storing prompt templates and parameters in browsers LocalStorage */
2024-07-25 22:10:16 +00:00
const tts = window.speechSynthesis;
const ttsVoice = signal(null)
2023-07-05 20:51:13 +00:00
const llamaStats = signal(null)
2023-07-04 14:05:27 +00:00
const controller = signal(null)
2023-07-05 20:51:13 +00:00
2023-09-04 08:28:55 +00:00
// currently generating a completion?
const generating = computed(() => controller.value != null)
// has the user started a chat?
2023-07-05 20:51:13 +00:00
const chatStarted = computed(() => session.value.transcript.length > 0)
// Replace the session's transcript. A new session object is assigned to the
// signal; all other session fields are copied over unchanged.
const transcriptUpdate = (transcript) => {
  const nextSession = { ...session.value, transcript };
  session.value = nextSession;
}
2023-07-04 14:05:27 +00:00
// simple template replace
// Expand every {{key}} placeholder in `str`.
//
// Values are looked up in the current session, with `extraSettings` (if
// given) taking precedence. Each substituted value is expanded again, but
// that nested expansion only sees the session values, not `extraSettings`.
// `str` is converted with String(), so a missing key renders as "undefined".
const template = (str, extraSettings) => {
  const settings = extraSettings
    ? { ...session.value, ...extraSettings }
    : session.value;
  const expandPlaceholder = (_match, key) => template(settings[key]);
  return String(str).replaceAll(/\{\{(.*?)\}\}/g, expandPlaceholder);
}
2023-10-12 06:51:53 +00:00
// Stream one completion from the server and mirror it into the transcript.
//
//   prompt      - prompt text passed to llama()
//   llamaParams - request parameters passed to llama()
//   char        - speaker label stored with the generated message
//
// Throws Error("already running") if a request is already in flight.
//
// While streaming, every non-final chunk is appended to the message and the
// transcript is updated to `[...history, [char, chunks]]`, where `history` is
// the transcript as it was when the call started. On the final chunk
// (`data.stop`) trailing chunks whose content ends in a newline are dropped.
//
// The controller signal is cleared in a `finally` block, so the early return
// for the multimodal warning and any error thrown by llama() no longer leave
// the UI stuck in the "generating" state. It is only cleared when it still
// holds this call's own controller, so a request started after stop() is not
// affected.
async function runLlama(prompt, llamaParams, char) {
  if (controller.value) {
    throw new Error("already running");
  }
  const currentMessages = [];
  const history = session.value.transcript;
  const ownController = new AbortController();
  controller.value = ownController;
  try {
    for await (const chunk of llama(prompt, llamaParams, { controller: ownController, api_url: new URL('.', document.baseURI).href })) {
      const data = chunk.data;
      if (data.stop) {
        while (
          currentMessages.length > 0 &&
          currentMessages[currentMessages.length - 1].content.match(/\n$/) != null
        ) {
          currentMessages.pop();
        }
        transcriptUpdate([...history, [char, currentMessages]])
        console.log("Completion finished: '", currentMessages.map(msg => msg.content).join(''), "', summary: ", data);
      } else {
        currentMessages.push(data);
        // remember the slot reported by the server for the next request
        slot_id = data.slot_id;
        if (selected_image && !data.multimodal) {
          alert("The server was not compiled for multimodal or the model projector can't be loaded.");
          return;
        }
        transcriptUpdate([...history, [char, currentMessages]])
      }
      if (data.timings) {
        llamaStats.value = data;
      }
    }
  } finally {
    if (controller.value === ownController) {
      controller.value = null;
    }
  }
}
2023-07-04 14:05:27 +00:00
// send message to server
// Send one user message and stream the reply.
//
// Does nothing (apart from logging) when a request is already running.
// Otherwise the message is appended to the transcript under "{{user}}", the
// prompt is rendered from the session template with the formatted history,
// and the completion is run with "{{char}}" as the speaker. When an image has
// been selected, a fixed image prompt referencing [img-10] is used instead of
// the rendered template.
//
// The stop list starts with the literal end-of-sequence marker "</s>" (it had
// stray spaces in it and could never match), followed by the rendered
// "<char>:" and "<user>:" prefixes.
const chat = async (msg) => {
  if (controller.value) {
    console.log('already running...');
    return;
  }

  transcriptUpdate([...session.value.transcript, ["{{user}}", msg]])

  // One line per transcript entry. Streamed replies are arrays of chunks:
  // join them and drop a single leading whitespace character.
  const history = session.value.transcript.map(
    ([name, data]) =>
      template(
        session.value.historyTemplate,
        {
          name,
          message: Array.isArray(data) ?
            data.map(msg => msg.content).join('').replace(/^\s/, '') :
            data,
        }
      )
  ).join("\n");

  let prompt = template(session.value.template, {
    message: msg,
    history,
  });
  if (selected_image) {
    prompt = `A chat between a curious human and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the human's questions.\nUSER:[img-10]${msg}\nASSISTANT:`;
  }

  await runLlama(prompt, {
    ...params.value,
    slot_id: slot_id,
    stop: ["</s>", template("{{char}}:"), template("{{user}}:")],
  }, "{{char}}");
}
2023-07-04 14:05:27 +00:00
2023-11-10 22:49:33 +00:00
// Completion mode: continue the session prompt.
//
// Does nothing (apart from logging) when a request is already running.
// The prompt is pushed onto the transcript with an empty speaker and the
// completion is started with an empty stop list. When the run settles
// (success or failure), the whole transcript is flattened back into
// `session.value.prompt` and the transcript is emptied. Both are written
// directly on the current session object, without assigning the signal.
const runCompletion = () => {
  if (controller.value) {
    console.log('already running...');
    return;
  }

  const { prompt } = session.value;
  transcriptUpdate([...session.value.transcript, ["", prompt]]);

  const request = {
    ...params.value,
    slot_id: slot_id,
    stop: [],
  };

  const foldTranscriptIntoPrompt = () => {
    const pieces = session.value.transcript.map(([_, data]) =>
      Array.isArray(data) ? data.map(msg => msg.content).join('') : data
    );
    session.value.prompt = pieces.join('');
    session.value.transcript = [];
  };

  runLlama(prompt, request, "").finally(foldTranscriptIntoPrompt);
}
2023-07-05 20:51:13 +00:00
2023-10-12 06:51:53 +00:00
// Event handler: cancel the event's default action and, if a request is in
// flight, abort it and clear the controller signal.
const stop = (e) => {
  e.preventDefault();
  const active = controller.value;
  if (!active) {
    return;
  }
  active.abort();
  controller.value = null;
}
2023-07-04 14:05:27 +00:00
2023-10-12 06:51:53 +00:00
// Event handler: stop any running request, then empty the transcript.
const reset = (e) => {
  stop(e);
  const emptyTranscript = [];
  transcriptUpdate(emptyTranscript);
}
2023-10-22 19:53:08 +00:00
// Event handler: open the file picker of the #fileInput element and, once a
// file has been read, attach it to the session/params.
//
// The `change` listener is bound only once per input element (tracked with a
// data attribute on the element). Previously a new listener was added on
// every click, so after N clicks one selection was read and applied N times.
//
// After a successful read:
//   - session.image_selected holds the data URL (used for the preview),
//   - params.image_data holds the bare base64 payload with id 10,
//   - selected_image is set to true. This happens only here, so the flag is
//     never true while no image data is available yet.
const uploadImage = (e) => {
  e.preventDefault();
  const input = document.getElementById("fileInput");
  if (!input) {
    return;
  }
  if (!input.dataset.uploadBound) {
    input.dataset.uploadBound = "true";
    input.addEventListener("change", (event) => {
      const selectedFile = event.target.files[0];
      if (!selectedFile) {
        return;
      }
      const reader = new FileReader();
      reader.onload = () => {
        const image_data = reader.result;
        session.value = { ...session.value, image_selected: image_data };
        params.value = {
          ...params.value, image_data: [
            { data: image_data.replace(/data:image\/[^;]+;base64,/, ''), id: 10 }]
        };
        selected_image = true;
      };
      reader.readAsDataURL(selectedFile);
    });
  }
  // clear the previous selection so picking the same file again still fires `change`
  input.value = "";
  input.click();
}
2024-07-25 22:10:16 +00:00
const SpeechRecognition = window.SpeechRecognition || window.webkitSpeechRecognition;
const talkRecognition = SpeechRecognition ? new SpeechRecognition() : null;
2023-07-04 14:05:27 +00:00
// Chat input form: message textarea, Send / Upload Image / Stop / Reset
// buttons, speech-to-text ("Talk") controls and the bot voice selector.
//
// Changes from the previous version:
//   - the speech recognition result handler reads its own event parameter
//     instead of the deprecated global `event`,
//   - Enter is detected with `event.key` instead of the deprecated
//     `event.which`,
//   - buttons that are not the submit button declare type="button", so they
//     can never submit the form.
function MessageInput() {
  const message = useSignal("");

  // --- speech to text ---
  const talkActive = useSignal(false);
  const sendOnTalk = useSignal(false);
  const talkStop = (e) => {
    if (e) e.preventDefault();

    talkActive.value = false;
    talkRecognition?.stop();
  }
  const talk = (e) => {
    e.preventDefault();

    if (talkRecognition)
      talkRecognition.start();
    else
      alert("Speech recognition is not supported by this browser.");
  }
  if (talkRecognition) {
    talkRecognition.onstart = () => {
      talkActive.value = true;
    }
    talkRecognition.onresult = (e) => {
      if (e.results.length > 0) {
        // first alternative of the first result becomes the message text
        message.value = e.results[0][0].transcript;
        if (sendOnTalk.value) {
          submit(e);
        }
      }
    }
    talkRecognition.onspeechend = () => {
      talkStop();
    }
  }

  // --- text to speech voices ---
  const ttsVoices = useSignal(tts?.getVoices() || []);
  const ttsVoiceDefault = computed(() => ttsVoices.value.find(v => v.default));
  if (tts) {
    tts.onvoiceschanged = () => {
      ttsVoices.value = tts.getVoices();
    }
  }

  // Stop any running request, send the current text and clear the input.
  const submit = (e) => {
    stop(e);
    chat(message.value);
    message.value = "";
  }

  // Enter sends the message; Shift+Enter is left alone.
  const enterSubmits = (event) => {
    if (event.key === "Enter" && !event.shiftKey) {
      submit(event);
    }
  }

  return html`
    <form onsubmit=${submit}>
      <div>
        <textarea
           className=${generating.value ? "loading" : null}
           oninput=${(e) => message.value = e.target.value}
           onkeypress=${enterSubmits}
           placeholder="Say something..."
           rows=2
           type="text"
           value="${message}"
        />
      </div>
      <div class="message-controls">
        <div></div>
        <div>
          <div>
            <button type="submit" disabled=${generating.value || talkActive.value}>Send</button>
            <button type="button" disabled=${generating.value || talkActive.value} onclick=${uploadImage}>Upload Image</button>
            <button type="button" onclick=${stop} disabled=${!generating.value}>Stop</button>
            <button type="button" onclick=${reset}>Reset</button>
          </div>
          <div>
            <a href="#" style="cursor: help;" title="Help" onclick=${e => {
              e.preventDefault();
              alert(`STT supported by your browser: ${SpeechRecognition ? 'Yes' : 'No'}\n` +
              `(TTS and speech recognition are not provided by llama.cpp)\n` +
              `Note: STT requires HTTPS to work.`);
            }}>[?]</a>
            <button type="button" disabled=${generating.value} onclick=${talkActive.value ? talkStop : talk}>${talkActive.value ? "Stop Talking" : "Talk"}</button>
            <div>
              <input type="checkbox" id="send-on-talk" name="send-on-talk" checked="${sendOnTalk}" onchange=${(e) => sendOnTalk.value = e.target.checked} />
              <label for="send-on-talk" style="line-height: initial;">Send after talking</label>
            </div>
          </div>
          <div>
            <a href="#" style="cursor: help;" title="Help" onclick=${e => {
              e.preventDefault();
              alert(`TTS supported by your browser: ${tts ? 'Yes' : 'No'}\n(TTS and speech recognition are not provided by llama.cpp)`);
            }}>[?]</a>
            <label for="tts-voices" style="line-height: initial;">Bot Voice:</label>
            <select id="tts-voices" name="tts-voices" onchange=${(e) => ttsVoice.value = e.target.value} style="max-width: 100px;">
              <option value="" selected="${!ttsVoice.value}">None</option>
              ${[
                ...(ttsVoiceDefault.value ? [ttsVoiceDefault.value] : []),
                ...ttsVoices.value.filter(v => !v.default),
              ].map(
                v => html`<option value="${v.name}" selected="${ttsVoice.value === v.name}">${v.name} (${v.lang}) ${v.default ? '(default)' : ''}</option>`
              )}
            </select>
          </div>
        </div>
      </div>
    </form>
  `
}
2023-10-12 06:51:53 +00:00
// Start / Stop / Reset buttons for completion mode. Start is disabled while
// a completion is being generated; Stop is disabled while none is.
function CompletionControls() {
  const busy = generating.value;

  // Stop whatever is running, then start a new completion.
  const startCompletion = (e) => {
    stop(e);
    runCompletion();
  };

  return html`
    <div>
      <button onclick=${startCompletion} type="button" disabled=${busy}>Start</button>
      <button onclick=${stop} disabled=${!busy}>Stop</button>
      <button onclick=${reset}>Reset</button>
    </div>`;
}
2023-07-04 14:05:27 +00:00
// Transcript view: renders every transcript entry, keeps the log scrolled to
// the bottom, and optionally reads bot messages aloud with speech synthesis.
//
// Changes from the previous version:
//   - the play/pause <button> is closed with </button> (it was closed with
//     </div>),
//   - the scroll effect tolerates the ref not being attached yet,
//   - the preview image carries an alt text.
const ChatLog = (props) => {
  const messages = session.value.transcript;
  const container = useRef(null)

  useEffect(() => {
    // scroll to bottom (if needed): only when the view is already within
    // 300px of the bottom, so a user who scrolled further up is not moved
    const parent = container.current?.parentElement;
    if (parent && parent.scrollHeight <= parent.scrollTop + parent.offsetHeight + 300) {
      parent.scrollTo(0, parent.scrollHeight)
    }
  }, [messages])

  // Index of the chat line currently being spoken, or undefined.
  const ttsChatLineActiveIx = useSignal(undefined);

  // Speak `msg` for chat line `ix` with the selected voice. Any utterance in
  // progress is cancelled first; asking again for the line that is currently
  // playing therefore just stops it.
  const ttsChatLine = (e, ix, msg) => {
    if (e) e.preventDefault();

    if (!tts || !ttsVoice.value || !('SpeechSynthesisUtterance' in window)) return;

    const ttsVoices = tts.getVoices();
    const voice = ttsVoices.find(v => v.name === ttsVoice.value);
    if (!voice) return;

    if (ttsChatLineActiveIx.value !== undefined) {
      tts.cancel();
      if (ttsChatLineActiveIx.value === ix) {
        ttsChatLineActiveIx.value = undefined;
        return;
      }
    }

    ttsChatLineActiveIx.value = ix;
    let ttsUtter = new SpeechSynthesisUtterance(msg);
    ttsUtter.voice = voice;
    ttsUtter.onend = e => {
      ttsChatLineActiveIx.value = undefined;
    };
    tts.speak(ttsUtter);
  }

  const isCompletionMode = session.value.type === 'completion'

  // Try play the last bot message: `lastCharChatLinesIxs` collects the
  // indices of bot lines seen while rendering, `...Old` is the snapshot taken
  // the last time a message was played. A length difference once generation
  // has finished means there is a new bot message.
  const lastCharChatLinesIxs = useSignal([]);
  const lastCharChatLinesIxsOld = useSignal([]);
  useEffect(() => {
    if (
      !isCompletionMode
      && lastCharChatLinesIxs.value.length !== lastCharChatLinesIxsOld.value.length
      && !generating.value
    ) {
      const ix = lastCharChatLinesIxs.value[lastCharChatLinesIxs.value.length - 1];
      if (ix !== undefined) {
        const msg = messages[ix];
        ttsChatLine(null, ix, Array.isArray(msg) ? msg[1].map(m => m.content).join('') : msg);
      }

      lastCharChatLinesIxsOld.value = structuredClone(lastCharChatLinesIxs.value);
    }
  }, [generating.value]);

  // Render one transcript entry `[user, data]`. `data` is either a plain
  // string or an array of streamed chunks with a `content` field.
  const chatLine = ([user, data], index) => {
    let message
    const isArrayMessage = Array.isArray(data);
    const text = isArrayMessage ?
      data.map(msg => msg.content).join('') :
      data;
    if (params.value.n_probs > 0 && isArrayMessage) {
      message = html`<${Probabilities} data=${data} />`
    } else {
      message = isCompletionMode ?
        text :
        html`<${Markdownish} text=${template(text)} />`
    }

    // bot lines are recorded (in place, during render) for the autoplay effect above
    const fromBot = user && user === '{{char}}';
    if (fromBot && !lastCharChatLinesIxs.value.includes(index))
      lastCharChatLinesIxs.value.push(index);

    if (user) {
      return html`
        <div>
          <p key=${index}><strong>${template(user)}:</strong> ${message}</p>
          ${
            fromBot && ttsVoice.value
            && html`<button disabled=${generating.value} onclick=${e => ttsChatLine(e, index, text)} aria-label=${ttsChatLineActiveIx.value === index ? 'Pause' : 'Play'}>${ ttsChatLineActiveIx.value === index ? '⏸️' : '▶️' }</button>`
          }
        </div>
      `;
    } else {
      return isCompletionMode ?
        html`<span key=${index}>${message}</span>` :
        html`<div><p key=${index}>${message}</p></div>`
    }
  };

  // Completion mode only: the edited text becomes the new prompt. Both fields
  // are written directly on the current session object, without assigning
  // the signal.
  const handleCompletionEdit = (e) => {
    session.value.prompt = e.target.innerText;
    session.value.transcript = [];
  }

  // NOTE(review): the same ref object is attached to both the outer div and
  // the inner span; kept as it was.
  return html`
    <div id="chat" ref=${container} key=${messages.length}>
      <img style="width: 60%;${!session.value.image_selected ? `display: none;` : ``}" src="${session.value.image_selected}" alt="Selected image" />
      <span contenteditable=${isCompletionMode} ref=${container} oninput=${handleCompletionEdit}>
        ${messages.flatMap(chatLine)}
      </span>
    </div>`;
};
const ConfigForm = (props) => {
const updateSession = (el) => session.value = { ...session.value, [el.target.name]: el.target.value }
const updateParams = (el) => params.value = { ...params.value, [el.target.name]: el.target.value }
const updateParamsFloat = (el) => params.value = { ...params.value, [el.target.name]: parseFloat(el.target.value) }
2023-07-24 14:54:22 +00:00
const updateParamsInt = (el) => params.value = { ...params.value, [el.target.name]: Math.floor(parseFloat(el.target.value)) }
2024-04-04 15:03:00 +00:00
const updateParamsBool = (el) => params.value = { ...params.value, [el.target.name]: el.target.checked }
2023-07-24 14:54:22 +00:00
2023-08-14 07:16:54 +00:00
const grammarJsonSchemaPropOrder = signal('')
const updateGrammarJsonSchemaPropOrder = (el) => grammarJsonSchemaPropOrder.value = el.target.value
json-schema-to-grammar improvements (+ added to server) (#5978)
* json: fix arrays (disallow `[,1]`)
* json: support tuple types (`[number, string]`)
* json: support additionalProperties (`{[k: string]: [string,number][]}`)
* json: support required / optional properties
* json: add support for pattern
* json: resolve $ref (and support https schema urls)
* json: fix $ref resolution
* join: support union types (mostly for nullable types I think)
* json: support allOf + nested anyOf
* json: support any (`{}` or `{type: object}`)
* json: fix merge
* json: temp fix for escapes
* json: spaces in output and unrestricted output spaces
* json: add typings
* json:fix typo
* Create ts-type-to-grammar.sh
* json: fix _format_literal (json.dumps already escapes quotes)
* json: merge lit sequences and handle negatives
{"type": "string", "pattern": "^({\"question\": \"[^\"]+\", \"response\": \"[^\"]+\"}\\n)+$"}
* json: handle pattern repetitions
* Update json-schema-to-grammar.mjs
* Create regex-to-grammar.py
* json: extract repeated regexp patterns to subrule
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* json: handle schema from pydantic Optional fields
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update ts-type-to-grammar.sh
* Update ts-type-to-grammar.sh
* json: simplify nullable fields handling
* json: accept duplicate identical rules
* json: revert space to 1 at most
* json: reuse regexp pattern subrules
* json: handle uuid string format
* json: fix literal escapes
* json: add --allow-fetch
* json: simplify range escapes
* json: support negative ranges in patterns
* Delete commit.txt
* json: custom regex parser, adds dot support & JS-portable
* json: rm trailing spaces
* Update json-schema-to-grammar.mjs
* json: updated server & chat `( cd examples/server && ./deps.sh )`
* json: port fixes from mjs to python
* Update ts-type-to-grammar.sh
* json: support prefixItems alongside array items
* json: add date format + fix uuid
* json: add date, time, date-time formats
* json: preserve order of props from TS defs
* json: port schema converter to C++, wire in ./server
* json: nits
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* json: fix mjs implementation + align outputs
* Update json-schema-to-grammar.mjs.hpp
* json: test C++, JS & Python versions
* json: nits + regen deps
* json: cleanup test
* json: revert from c++17 to 11
* json: nit fixes
* json: dirty include for test
* json: fix zig build
* json: pass static command to std::system in tests (fixed temp files)
* json: fix top-level $refs
* json: don't use c++20 designated initializers
* nit
* json: basic support for reserved names `{number:{number:{root:number}}}`
* Revamp test cmake to allow args (WORKING_DIRECTORY needed for JSON test)
* json: re-ran server deps.sh
* json: simplify test
* json: support mix of additional props & required/optional
* json: add tests for some expected failures
* json: fix type=const in c++, add failure expectations for non-str const&enum
* json: test (& simplify output of) empty schema
* json: check parsing in test + fix value & string refs
* json: add server tests for OAI JSON response_format
* json: test/fix top-level anyOf
* json: improve grammar parsing failures
* json: test/fix additional props corner cases
* json: fix string patterns (was missing quotes)
* json: ws nit
* json: fix json handling in server when there's no response_format
* json: catch schema conversion errors in server
* json: don't complain about unknown format type in server if unset
* json: cleaner build of test
* json: create examples/json-schema-pydantic-example.py
* json: fix date pattern
* json: move json.hpp & json-schema-to-grammar.{cpp,h} to common
* json: indent 4 spaces
* json: fix naming of top-level c++ function (+ drop unused one)
* json: avoid using namespace std
* json: fix zig build
* Update server.feature
* json: iostream -> fprintf
* json: space before & refs for consistency
* json: nits
2024-03-21 11:50:43 +00:00
const convertJSONSchemaGrammar = async () => {
2023-08-14 07:16:54 +00:00
try {
json-schema-to-grammar improvements (+ added to server) (#5978)
* json: fix arrays (disallow `[,1]`)
* json: support tuple types (`[number, string]`)
* json: support additionalProperties (`{[k: string]: [string,number][]}`)
* json: support required / optional properties
* json: add support for pattern
* json: resolve $ref (and support https schema urls)
* json: fix $ref resolution
* join: support union types (mostly for nullable types I think)
* json: support allOf + nested anyOf
* json: support any (`{}` or `{type: object}`)
* json: fix merge
* json: temp fix for escapes
* json: spaces in output and unrestricted output spaces
* json: add typings
* json:fix typo
* Create ts-type-to-grammar.sh
* json: fix _format_literal (json.dumps already escapes quotes)
* json: merge lit sequences and handle negatives
{"type": "string", "pattern": "^({\"question\": \"[^\"]+\", \"response\": \"[^\"]+\"}\\n)+$"}
* json: handle pattern repetitions
* Update json-schema-to-grammar.mjs
* Create regex-to-grammar.py
* json: extract repeated regexp patterns to subrule
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* json: handle schema from pydantic Optional fields
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update ts-type-to-grammar.sh
* Update ts-type-to-grammar.sh
* json: simplify nullable fields handling
* json: accept duplicate identical rules
* json: revert space to 1 at most
* json: reuse regexp pattern subrules
* json: handle uuid string format
* json: fix literal escapes
* json: add --allow-fetch
* json: simplify range escapes
* json: support negative ranges in patterns
* Delete commit.txt
* json: custom regex parser, adds dot support & JS-portable
* json: rm trailing spaces
* Update json-schema-to-grammar.mjs
* json: updated server & chat `( cd examples/server && ./deps.sh )`
* json: port fixes from mjs to python
* Update ts-type-to-grammar.sh
* json: support prefixItems alongside array items
* json: add date format + fix uuid
* json: add date, time, date-time formats
* json: preserve order of props from TS defs
* json: port schema converter to C++, wire in ./server
* json: nits
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* json: fix mjs implementation + align outputs
* Update json-schema-to-grammar.mjs.hpp
* json: test C++, JS & Python versions
* json: nits + regen deps
* json: cleanup test
* json: revert from c++17 to 11
* json: nit fixes
* json: dirty include for test
* json: fix zig build
* json: pass static command to std::system in tests (fixed temp files)
* json: fix top-level $refs
* json: don't use c++20 designated initializers
* nit
* json: basic support for reserved names `{number:{number:{root:number}}}`
* Revamp test cmake to allow args (WORKING_DIRECTORY needed for JSON test)
* json: re-ran server deps.sh
* json: simplify test
* json: support mix of additional props & required/optional
* json: add tests for some expected failures
* json: fix type=const in c++, add failure expectations for non-str const&enum
* json: test (& simplify output of) empty schema
* json: check parsing in test + fix value & string refs
* json: add server tests for OAI JSON response_format
* json: test/fix top-level anyOf
* json: improve grammar parsing failures
* json: test/fix additional props corner cases
* json: fix string patterns (was missing quotes)
* json: ws nit
* json: fix json handling in server when there's no response_format
* json: catch schema conversion errors in server
* json: don't complain about unknown format type in server if unset
* json: cleaner build of test
* json: create examples/json-schema-pydantic-example.py
* json: fix date pattern
* json: move json.hpp & json-schema-to-grammar.{cpp,h} to common
* json: indent 4 spaces
* json: fix naming of top-level c++ function (+ drop unused one)
* json: avoid using namespace std
* json: fix zig build
* Update server.feature
* json: iostream -> fprintf
* json: space before & refs for consistency
* json: nits
2024-03-21 11:50:43 +00:00
let schema = JSON.parse(params.value.grammar)
const converter = new SchemaConverter({
prop_order: grammarJsonSchemaPropOrder.value
2023-08-14 07:16:54 +00:00
.split(',')
json-schema-to-grammar improvements (+ added to server) (#5978)
* json: fix arrays (disallow `[,1]`)
* json: support tuple types (`[number, string]`)
* json: support additionalProperties (`{[k: string]: [string,number][]}`)
* json: support required / optional properties
* json: add support for pattern
* json: resolve $ref (and support https schema urls)
* json: fix $ref resolution
* json: support union types (mostly for nullable types I think)
* json: support allOf + nested anyOf
* json: support any (`{}` or `{type: object}`)
* json: fix merge
* json: temp fix for escapes
* json: spaces in output and unrestricted output spaces
* json: add typings
* json: fix typo
* Create ts-type-to-grammar.sh
* json: fix _format_literal (json.dumps already escapes quotes)
* json: merge lit sequences and handle negatives
{"type": "string", "pattern": "^({\"question\": \"[^\"]+\", \"response\": \"[^\"]+\"}\\n)+$"}
* json: handle pattern repetitions
* Update json-schema-to-grammar.mjs
* Create regex-to-grammar.py
* json: extract repeated regexp patterns to subrule
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* json: handle schema from pydantic Optional fields
* Update json-schema-to-grammar.py
* Update json-schema-to-grammar.py
* Update ts-type-to-grammar.sh
* Update ts-type-to-grammar.sh
* json: simplify nullable fields handling
* json: accept duplicate identical rules
* json: revert space to 1 at most
* json: reuse regexp pattern subrules
* json: handle uuid string format
* json: fix literal escapes
* json: add --allow-fetch
* json: simplify range escapes
* json: support negative ranges in patterns
* Delete commit.txt
* json: custom regex parser, adds dot support & JS-portable
* json: rm trailing spaces
* Update json-schema-to-grammar.mjs
* json: updated server & chat `( cd examples/server && ./deps.sh )`
* json: port fixes from mjs to python
* Update ts-type-to-grammar.sh
* json: support prefixItems alongside array items
* json: add date format + fix uuid
* json: add date, time, date-time formats
* json: preserve order of props from TS defs
* json: port schema converter to C++, wire in ./server
* json: nits
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* Update json-schema-to-grammar.cpp
* json: fix mjs implementation + align outputs
* Update json-schema-to-grammar.mjs.hpp
* json: test C++, JS & Python versions
* json: nits + regen deps
* json: cleanup test
* json: revert from c++17 to 11
* json: nit fixes
* json: dirty include for test
* json: fix zig build
* json: pass static command to std::system in tests (fixed temp files)
* json: fix top-level $refs
* json: don't use c++20 designated initializers
* nit
* json: basic support for reserved names `{number:{number:{root:number}}}`
* Revamp test cmake to allow args (WORKING_DIRECTORY needed for JSON test)
* json: re-ran server deps.sh
* json: simplify test
* json: support mix of additional props & required/optional
* json: add tests for some expected failures
* json: fix type=const in c++, add failure expectations for non-str const&enum
* json: test (& simplify output of) empty schema
* json: check parsing in test + fix value & string refs
* json: add server tests for OAI JSON response_format
* json: test/fix top-level anyOf
* json: improve grammar parsing failures
* json: test/fix additional props corner cases
* json: fix string patterns (was missing quotes)
* json: ws nit
* json: fix json handling in server when there's no response_format
* json: catch schema conversion errors in server
* json: don't complain about unknown format type in server if unset
* json: cleaner build of test
* json: create examples/json-schema-pydantic-example.py
* json: fix date pattern
* json: move json.hpp & json-schema-to-grammar.{cpp,h} to common
* json: indent 4 spaces
* json: fix naming of top-level c++ function (+ drop unused one)
* json: avoid using namespace std
* json: fix zig build
* Update server.feature
* json: iostream -> fprintf
* json: space before & refs for consistency
* json: nits
2024-03-21 11:50:43 +00:00
.reduce((acc, cur, i) => ({ ...acc, [cur.trim()]: i }), {}),
allow_fetch: true,
})
schema = await converter.resolveRefs(schema, 'input')
2023-08-14 07:16:54 +00:00
converter.visit(schema, '')
params.value = {
...params.value,
grammar: converter.formatGrammar(),
}
} catch (e) {
alert(`Convert failed: ${e.message}`)
}
}
2023-10-22 19:53:08 +00:00
/**
 * Slider row for a floating-point parameter.
 *
 * Renders a label, a range input (id and name both taken from `name`, bounded
 * by `min`/`max` with increment `step`) and the current value as text.
 * Input events on the slider are handed to updateParamsFloat.
 */
const FloatField = (props) => {
  const { label, max, min, name, step, value } = props;
  return html`
< div >
< label for = "${name}" > ${label}< / label >
< input type = "range" id = "${name}" min = "${min}" max = "${max}" step = "${step}" name = "${name}" value = "${value}" oninput = ${updateParamsFloat} / >
< span > ${value}< / span >
< / div >
`;
};
2023-10-22 19:53:08 +00:00
/**
 * Slider row for an integer parameter.
 *
 * @param {object} props
 * @param {string} props.label   Text shown in the label.
 * @param {number} props.max     Upper bound of the slider.
 * @param {number} props.min     Lower bound of the slider.
 * @param {string} props.name    Used as both `id` and `name` of the input.
 * @param {number} [props.step]  Optional slider increment. Some callers pass it
 *                               (the DRY sliders); previously it was silently
 *                               dropped. When omitted the browser default applies.
 * @param {number} props.value   Current value, also echoed next to the slider.
 *
 * Input events on the slider are handed to updateParamsInt.
 */
const IntField = ({ label, max, min, name, step, value }) => {
  return html`
    <div>
      <label for="${name}">${label}</label>
      <input type="range" id="${name}" min="${min}" max="${max}" step=${step} name="${name}" value="${value}" oninput=${updateParamsInt} />
      <span>${value}</span>
    </div>
  `;
};
2023-07-04 14:05:27 +00:00
2024-04-04 15:03:00 +00:00
/**
 * Checkbox row for a boolean parameter.
 *
 * `name` doubles as the checkbox id and name, `value` drives its checked
 * state, and clicks are handed to updateParamsBool.
 */
const BoolField = (props) => {
  const { label, name, value } = props;
  return html`
< div >
< label for = "${name}" > ${label}< / label >
< input type = "checkbox" id = "${name}" name = "${name}" checked = "${value}" onclick = ${updateParamsBool} / >
< / div >
`;
};
2023-08-17 23:34:01 +00:00
// Click handler for the reset button: cancel the event's default action,
// then restore and apply the default user template.
const userTemplateReset = (event) => {
  event.preventDefault();
  userTemplateResetToDefaultAndApply();
};
// Shows a disabled placeholder button while the selected template is named
// 'default'; otherwise shows a button wired to userTemplateReset.
const UserTemplateResetButton = () => {
  const usingDefault = selectedUserTemplate.value.name == 'default';
  return usingDefault
    ? html`
< button disabled > Using default template< / button >
`
    : html`
< button onclick = ${userTemplateReset} > Reset all to default< / button >
`;
};
// Autosave the template each time the session or the params value changes.
useEffect(function autosaveOnChange() {
  userTemplateAutosave();
}, [session.value, params.value]);
2023-10-12 06:51:53 +00:00
/**
 * Grammar editor: a textarea bound to params.value.grammar, a text input for
 * the JSON-schema property order, and a button that runs
 * convertJSONSchemaGrammar.
 *
 * The label now targets the grammar textarea (`for="grammar"`); it previously
 * pointed at "template", which is the id of a different control.
 */
const GrammarControl = () => (
  html`
    <div>
      <label for="grammar">Grammar</label>
      <textarea id="grammar" name="grammar" placeholder="Use gbnf or JSON Schema+convert" value="${params.value.grammar}" rows=4 oninput=${updateParams}/>
      <input type="text" name="prop-order" placeholder="order: prop1,prop2,prop3" oninput=${updateGrammarJsonSchemaPropOrder} />
      <button type="button" onclick=${convertJSONSchemaGrammar}>Convert JSON Schema</button>
    </div>
  `
);
2023-08-17 23:34:01 +00:00
2023-10-12 06:51:53 +00:00
/**
 * Fieldset holding the prompt textarea, bound to session.value.prompt and
 * updated through updateSession.
 *
 * The textarea carries id="prompt" so that the label (which already targeted
 * "prompt") is actually associated with it.
 */
const PromptControlFieldSet = () => (
  html`
    <fieldset>
      <div>
        <label for="prompt">Prompt</label>
        <textarea id="prompt" type="text" name="prompt" value="${session.value.prompt}" oninput=${updateSession}/>
      </div>
    </fieldset>
  `
);
/**
 * Chat-mode settings: the prompt fieldset, user/bot names, the prompt and
 * chat-history templates, and the grammar control. Every field is bound to
 * session.value and updated through updateSession.
 *
 * Label/control association fixes:
 *  - the user and bot inputs now have ids matching their labels' `for`
 *    (the `name` attributes, which updateSession receives, are unchanged);
 *  - the history-template textarea has its own id instead of reusing
 *    "template", so ids are unique and its label points at the right control.
 */
const ChatConfigForm = () => (
  html`
    ${PromptControlFieldSet()}

    <fieldset class="two">
      <div>
        <label for="user">User name</label>
        <input type="text" id="user" name="user" value="${session.value.user}" oninput=${updateSession} />
      </div>

      <div>
        <label for="bot">Bot name</label>
        <input type="text" id="bot" name="char" value="${session.value.char}" oninput=${updateSession} />
      </div>
    </fieldset>

    <fieldset>
      <div>
        <label for="template">Prompt template</label>
        <textarea id="template" name="template" value="${session.value.template}" rows=4 oninput=${updateSession}/>
      </div>

      <div>
        <label for="historyTemplate">Chat history template</label>
        <textarea id="historyTemplate" name="historyTemplate" value="${session.value.historyTemplate}" rows=1 oninput=${updateSession}/>
      </div>
      ${GrammarControl()}
    </fieldset>
  `
);
2023-10-12 06:51:53 +00:00
// Completion-mode settings: the prompt fieldset followed by the grammar
// control wrapped in its own fieldset.
const CompletionConfigForm = () => {
  return html`
${PromptControlFieldSet()}
< fieldset > ${GrammarControl()}< / fieldset >
`;
};
2023-08-14 07:16:54 +00:00
2023-10-12 06:51:53 +00:00
return html`
< form >
< fieldset class = "two" >
< ${UserTemplateResetButton}/>
2023-08-14 07:16:54 +00:00
< div >
2023-10-12 06:51:53 +00:00
< label class = "slim" > < input type = "radio" name = "type" value = "chat" checked = ${session.value.type = = = " chat " } oninput = ${updateSession} / > Chat< / label >
< label class = "slim" > < input type = "radio" name = "type" value = "completion" checked = ${session.value.type = = = " completion " } oninput = ${updateSession} / > Completion< / label >
2023-08-14 07:16:54 +00:00
< / div >
2023-07-24 14:54:22 +00:00
< / fieldset >
2023-07-04 14:05:27 +00:00
2023-10-12 06:51:53 +00:00
${session.value.type === 'chat' ? ChatConfigForm() : CompletionConfigForm()}
2023-07-24 14:54:22 +00:00
< fieldset class = "two" >
2023-10-22 19:53:08 +00:00
${IntField({ label: "Predictions", max: 2048, min: -1, name: "n_predict", value: params.value.n_predict })}
2023-12-12 10:12:35 +00:00
${FloatField({ label: "Temperature", max: 2.0, min: 0.0, name: "temperature", step: 0.01, value: params.value.temperature })}
2023-10-22 19:53:08 +00:00
${FloatField({ label: "Penalize repeat sequence", max: 2.0, min: 0.0, name: "repeat_penalty", step: 0.01, value: params.value.repeat_penalty })}
${IntField({ label: "Consider N tokens for penalize", max: 2048, min: 0, name: "repeat_last_n", value: params.value.repeat_last_n })}
2024-04-04 15:03:00 +00:00
${BoolField({ label: "Penalize repetition of newlines", name: "penalize_nl", value: params.value.penalize_nl })}
2023-10-22 19:53:08 +00:00
${IntField({ label: "Top-K sampling", max: 100, min: -1, name: "top_k", value: params.value.top_k })}
${FloatField({ label: "Top-P sampling", max: 1.0, min: 0.0, name: "top_p", step: 0.01, value: params.value.top_p })}
2023-11-09 02:00:34 +00:00
${FloatField({ label: "Min-P sampling", max: 1.0, min: 0.0, name: "min_p", step: 0.01, value: params.value.min_p })}
2023-07-04 14:05:27 +00:00
< / fieldset >
2023-07-24 14:54:22 +00:00
< details >
< summary > More options< / summary >
< fieldset class = "two" >
2023-10-22 19:53:08 +00:00
${FloatField({ label: "Typical P", max: 1.0, min: 0.0, name: "typical_p", step: 0.01, value: params.value.typical_p })}
${FloatField({ label: "Presence penalty", max: 1.0, min: 0.0, name: "presence_penalty", step: 0.01, value: params.value.presence_penalty })}
${FloatField({ label: "Frequency penalty", max: 1.0, min: 0.0, name: "frequency_penalty", step: 0.01, value: params.value.frequency_penalty })}
2024-10-25 16:07:34 +00:00
${FloatField({ label: "DRY Penalty Multiplier", max: 5.0, min: 0.0, name: "dry_multiplier", step: 0.01, value: params.value.dry_multiplier })}
${FloatField({ label: "DRY Base", max: 3.0, min: 1.0, name: "dry_base", step: 0.01, value: params.value.dry_base })}
${IntField({ label: "DRY Allowed Length", max: 10, min: 2, step: 1, name: "dry_allowed_length", value: params.value.dry_allowed_length })}
${IntField({ label: "DRY Penalty Last N", max: 2048, min: -1, step: 16, name: "dry_penalty_last_n", value: params.value.dry_penalty_last_n })}
2024-10-15 10:54:55 +00:00
${FloatField({ label: "XTC probability", max: 1.0, min: 0.0, name: "xtc_probability", step: 0.01, value: params.value.xtc_probability })}
${FloatField({ label: "XTC threshold", max: 0.5, min: 0.0, name: "xtc_threshold", step: 0.01, value: params.value.xtc_threshold })}
2023-07-24 14:54:22 +00:00
< / fieldset >
< hr / >
< fieldset class = "three" >
< div >
< label > < input type = "radio" name = "mirostat" value = "0" checked = ${params.value.mirostat = = 0 } oninput = ${updateParamsInt} / > no Mirostat< / label >
< label > < input type = "radio" name = "mirostat" value = "1" checked = ${params.value.mirostat = = 1 } oninput = ${updateParamsInt} / > Mirostat v1< / label >
< label > < input type = "radio" name = "mirostat" value = "2" checked = ${params.value.mirostat = = 2 } oninput = ${updateParamsInt} / > Mirostat v2< / label >
< / div >
2023-10-22 19:53:08 +00:00
${FloatField({ label: "Mirostat tau", max: 10.0, min: 0.0, name: "mirostat_tau", step: 0.01, value: params.value.mirostat_tau })}
${FloatField({ label: "Mirostat eta", max: 1.0, min: 0.0, name: "mirostat_eta", step: 0.01, value: params.value.mirostat_eta })}
2023-07-24 14:54:22 +00:00
< / fieldset >
2023-08-25 10:32:45 +00:00
< fieldset >
2023-10-22 19:53:08 +00:00
${IntField({ label: "Show Probabilities", max: 10, min: 0, name: "n_probs", value: params.value.n_probs })}
2023-08-25 10:32:45 +00:00
< / fieldset >
2024-02-18 19:11:16 +00:00
< fieldset >
${IntField({ label: "Min Probabilities from each Sampler", max: 10, min: 0, name: "min_keep", value: params.value.min_keep })}
< / fieldset >
2023-12-15 11:49:01 +00:00
< fieldset >
< label for = "api_key" > API Key< / label >
< input type = "text" name = "api_key" value = "${params.value.api_key}" placeholder = "Enter API key" oninput = ${updateParams} / >
< / fieldset >
2023-07-24 14:54:22 +00:00
< / details >
2023-07-04 14:05:27 +00:00
< / form >
`
}
2023-08-25 10:32:45 +00:00
// Translate a probability into a translucent rgba() colour string: the red
// channel scales with (1 - p), the green channel with p, both out of 192;
// blue is fixed at 0 and alpha at 0.3.
const probColor = (p) => {
  const red = Math.floor((1 - p) * 192);
  const green = Math.floor(p * 192);
  return 'rgba(' + red + ',' + green + ',0,0.3)';
};
/**
 * Renders each entry of params.data either as its plain content or as a
 * Popover listing the candidate tokens and their probabilities.
 *
 * Each entry is read for `content` and `completion_probabilities`; each
 * probability record is read for `content` and `probs`, and each item of
 * `probs` for `tok_str` and `prob`.
 */
const Probabilities = (params) => {
return params.data.map(msg => {
const { completion_probabilities } = msg;
// Nothing to annotate: emit the raw content.
if (
!completion_probabilities ||
completion_probabilities.length === 0
) return msg.content
// Several probability records on one message: split into one entry per
// record and render those through this same component.
if (completion_probabilities.length > 1) {
// Not for byte pair
if (completion_probabilities[0].content.startsWith('byte: \\')) return msg.content
const splitData = completion_probabilities.map(prob => ({
content: prob.content,
completion_probabilities: [prob]
}))
return html`< ${Probabilities} data=${splitData} />`
}
// Exactly one record from here on.
const { probs, content } = completion_probabilities[0]
// Colour the token by the probability of the candidate matching msg.content,
// or leave it transparent when no candidate matches.
const found = probs.find(p => p.tok_str === msg.content)
const pColor = found ? probColor(found.prob) : 'transparent'
// Popover body: one row per candidate; the row whose tok_str equals the
// record's content is highlighted with its probability colour.
const popoverChildren = html`
< div class = "prob-set" >
${probs.map((p, index) => {
2023-10-22 19:53:08 +00:00
return html`
2023-08-25 10:32:45 +00:00
< div
key=${index}
title=${`prob: ${p.prob}`}
style=${{
2023-10-22 19:53:08 +00:00
padding: '0.3em',
backgroundColor: p.tok_str === content ? probColor(p.prob) : 'transparent'
}}
2023-08-25 10:32:45 +00:00
>
< span > ${p.tok_str}: < / span >
< span > ${Math.floor(p.prob * 100)}%< / span >
< / div >
`
2023-10-22 19:53:08 +00:00
})}
2023-08-25 10:32:45 +00:00
< / div >
`
// Content containing a newline is shown as a line break instead of its text.
return html`
< ${Popover} style=${{ backgroundColor: pColor }} popoverChildren=${popoverChildren}>
${msg.content.match(/\n/gim) ? html`< br / > ` : msg.content}
< />
`
});
}
2023-07-05 20:51:13 +00:00
// poor man's markdown replacement
/**
 * Minimal markdown-to-HTML renderer for model output.
 *
 * Supports headings (rendered as <h3>), **bold** / __bold__, *emphasis* /
 * _emphasis_, `inline code`, ``` fenced code blocks and line breaks.
 *
 * The result is injected with dangerouslySetInnerHTML, so every piece of the
 * input text is HTML-escaped before any tag is generated. That includes the
 * contents of fenced code blocks, which were previously inserted verbatim.
 *
 * @param {{ text: string }} params  `text` is the raw text to render.
 * @returns a <span> whose inner HTML is the rendered markup.
 */
const Markdownish = (params) => {
  // Neutralise the characters that are significant in HTML so the text can
  // never introduce markup of its own. '&' must be replaced first.
  const escapeHtml = (text) => text
    .replace(/&/g, '&amp;')
    .replace(/</g, '&lt;')
    .replace(/>/g, '&gt;');

  // Splitting on the fence marker yields alternating segments: even indexes
  // are regular text, odd indexes are the contents of fenced code blocks.
  const chunks = params.text.split('```');
  for (let i = 0; i < chunks.length; i++) {
    if (i % 2 === 0) { // outside code block
      // No fence-matching replace is needed here: after the split above a
      // chunk can no longer contain a ``` sequence.
      chunks[i] = escapeHtml(chunks[i])
        .replace(/(^|\n)#{1,6} ([^\n]*)(?=([^`]*`[^`]*`)*[^`]*$)/g, '$1<h3>$2</h3>')
        .replace(/\*\*(.*?)\*\*(?=([^`]*`[^`]*`)*[^`]*$)/g, '<strong>$1</strong>')
        .replace(/__(.*?)__(?=([^`]*`[^`]*`)*[^`]*$)/g, '<strong>$1</strong>')
        .replace(/\*(.*?)\*(?=([^`]*`[^`]*`)*[^`]*$)/g, '<em>$1</em>')
        .replace(/_(.*?)_(?=([^`]*`[^`]*`)*[^`]*$)/g, '<em>$1</em>')
        .replace(/`(.*?)`/g, '<code>$1</code>')
        .replace(/\n/gim, '<br />');
    } else { // inside code block
      chunks[i] = `<pre><code>${escapeHtml(chunks[i])}</code></pre>`;
    }
  }
  const restoredText = chunks.join('');
  return html`<span dangerouslySetInnerHTML=${{ __html: restoredText }} />`;
};
// One-line generation summary read from llamaStats: predicted and cached token
// counts, milliseconds per token and tokens per second. Renders an empty span
// while no stats are available.
const ModelGenerationInfo = (params) => {
  const stats = llamaStats.value;
  if (stats) {
    return html`
< span >
${stats.tokens_predicted} predicted, ${stats.tokens_cached} cached, ${stats.timings.predicted_per_token_ms.toFixed()}ms per token, ${stats.timings.predicted_per_second.toFixed(2)} tokens per second
< / span >
`;
  }
  return html`< span / > `;
};
2023-07-04 14:05:27 +00:00
2024-05-28 04:41:14 +00:00
2023-08-25 10:32:45 +00:00
// simple popover impl
/**
 * Click-to-toggle popover.
 *
 * Renders props.children inside a span styled with props.style; clicking the
 * span toggles a `.popover-content` box containing props.popoverChildren.
 * The box is rendered through Portal into the element matching "#portal".
 */
const Popover = (props) => {
const isOpen = useSignal(false);
const position = useSignal({ top: '0px', left: '0px' });
const buttonRef = useRef(null);
const popoverRef = useRef(null);
// Record the trigger's bottom-left corner in page coordinates (viewport rect
// plus scroll offset), then flip the open state.
const togglePopover = () => {
if (buttonRef.current) {
const rect = buttonRef.current.getBoundingClientRect();
position.value = {
top: `${rect.bottom + window.scrollY}px`,
left: `${rect.left + window.scrollX}px`,
};
}
isOpen.value = !isOpen.value;
};
// Close when a mousedown lands outside both the popover and its trigger.
const handleClickOutside = (event) => {
if (popoverRef.current & & !popoverRef.current.contains(event.target) & & !buttonRef.current.contains(event.target)) {
isOpen.value = false;
}
};
// Register the document-level mousedown listener and remove it again in the
// effect's cleanup function.
useEffect(() => {
document.addEventListener('mousedown', handleClickOutside);
return () => {
document.removeEventListener('mousedown', handleClickOutside);
};
}, []);
return html`
< span style = ${props.style} ref = ${buttonRef} onClick = ${togglePopover} > $ { props . children } < / span >
${isOpen.value & & html`
< ${Portal} into="#portal">
< div
ref=${popoverRef}
class="popover-content"
style=${{
2023-10-22 19:53:08 +00:00
top: position.value.top,
left: position.value.left,
}}
2023-08-25 10:32:45 +00:00
>
${props.popoverChildren}
< / div >
< /${Portal}>
`}
`;
};
// Source: preact-portal (https://github.com/developit/preact-portal/blob/master/src/preact-portal.js)
/** Redirect rendering of descendants into the given CSS selector */
class Portal extends Component {
// Re-render the remote layer (asynchronously, via setTimeout) as soon as any
// key of the `props` argument differs from the current this.props.
componentDidUpdate(props) {
for (let i in props) {
if (props[i] !== this.props[i]) {
return setTimeout(this.renderLayer);
}
}
}
// Mark the component as mounted, bind renderLayer so it can be passed to
// setTimeout, and render the layer for the first time.
componentDidMount() {
this.isMounted = true;
this.renderLayer = this.renderLayer.bind(this);
this.renderLayer();
}
// Render the layer empty while still mounted, then flag as unmounted and
// detach the remote node from its parent.
componentWillUnmount() {
this.renderLayer(false);
this.isMounted = false;
if (this.remote & & this.remote.parentNode) this.remote.parentNode.removeChild(this.remote);
}
// Accept either a CSS selector string or a node; selectors are resolved with
// document.querySelector.
findNode(node) {
return typeof node === 'string' ? document.querySelector(node) : node;
}
// Render this.props.children (or nothing when `show` is false) into the
// target identified by this.props.into. No-op unless mounted.
renderLayer(show = true) {
if (!this.isMounted) return;
// clean up old node if moving bases:
if (this.props.into !== this.intoPointer) {
this.intoPointer = this.props.into;
if (this.into & & this.remote) {
this.remote = render(html`< ${PortalProxy} />`, this.into, this.remote);
}
this.into = this.findNode(this.props.into);
}
this.remote = render(html`
< ${PortalProxy} context=${this.context}>
${show & & this.props.children || null}
< /${PortalProxy}>
`, this.into, this.remote);
}
// The portal renders nothing in place; its output lives in the remote target.
render() {
return null;
}
}
// higher-order component that renders its first child if it exists.
// used as a conditional rendering proxy.
class PortalProxy extends Component {
  // Hand the context received through props on as the child context.
  getChildContext() {
    const { context } = this.props;
    return context;
  }

  // Output the children untouched, or null when there are none.
  render(props) {
    return props.children || null;
  }
}
2023-07-04 14:05:27 +00:00
/**
 * Root component of the page.
 *
 * Lays out the header (title plus link to index-new.html), the main area
 * (ChatLog once chatStarted is set, ConfigForm before that), the input section
 * (MessageInput in chat mode, CompletionControls otherwise) and the footer
 * with generation statistics. The wrapper's class is `mode-<session type>`.
 */
function App(props) {
2024-04-09 08:31:47 +00:00
// Runs once (empty dependency list): when the URL carries a `q` query
// parameter, pass its value to chat().
useEffect(() => {
const query = new URLSearchParams(location.search).get("q");
if (query) chat(query);
}, []);
2023-07-04 14:05:27 +00:00
return html`
2023-10-12 06:51:53 +00:00
< div class = "mode-${session.value.type}" >
2023-07-05 20:51:13 +00:00
< header >
2024-06-01 19:31:48 +00:00
< div class = "grid-container" >
< div class = "grid-item" > < / div >
< div class = "grid-item" > < h1 > llama.cpp< / h1 > < / div >
< div class = "grid-item" > < a class = "customlink" href = "index-new.html" > New UI< / a > < / div >
< / div >
2023-07-05 20:51:13 +00:00
< / header >
< main id = "content" >
< ${chatStarted.value ? ChatLog : ConfigForm} />
< / main >
< section id = "write" >
2023-10-12 06:51:53 +00:00
< ${session.value.type === 'chat' ? MessageInput : CompletionControls} />
2023-07-05 20:51:13 +00:00
< / section >
< footer >
< p > < ${ModelGenerationInfo} />< / p >
< p > Powered by < a href = "https://github.com/ggerganov/llama.cpp" > llama.cpp< / a > and < a href = "https://ggml.ai" > ggml.ai< / a > .< / p >
< / footer >
< / div >
2023-07-04 14:05:27 +00:00
`;
}
2023-08-25 10:32:45 +00:00
// Mount the App component into the element with id "container".
render(h(App), document.getElementById('container'));
2023-07-04 14:05:27 +00:00
< / script >
< / head >
< body >
2023-10-22 19:53:08 +00:00
<!-- Mount point: the inline script renders the App component into #container. -->
< div id = "container" >
<!-- Hidden file picker restricted to images; presumably opened from script elsewhere in the file (confirm against the caller). -->
< input type = "file" id = "fileInput" accept = "image/*" style = "display: none;" >
< / div >
2023-08-25 10:32:45 +00:00
<!-- Target of the Portal component (into="#portal"); popover content is rendered here. -->
< div id = "portal" > < / div >
2023-07-04 14:05:27 +00:00
< / body >
< / html >