coyotte508 HF staff commited on
Commit
ad6275a
·
unverified ·
1 Parent(s): bd37ed6

🐛 Stop bigcode prompts (#170)

Browse files
.env CHANGED
@@ -13,6 +13,7 @@ MODELS=`[
13
  "websiteUrl": "https://open-assistant.io",
14
  "userMessageToken": "<|prompter|>",
15
  "assistantMessageToken": "<|assistant|>",
 
16
  "preprompt": "Below are a series of dialogues between various people and an AI assistant. The AI tries to be helpful, polite, honest, sophisticated, emotionally aware, and humble-but-knowledgeable. The assistant is happy to help with almost anything, and will do its best to understand exactly what is needed. It also tries to avoid giving false or misleading information, and it caveats when it isn't entirely sure about the right answer. That said, the assistant is practical and really does its best, and doesn't let caution get too much in the way of being useful.\n-----\n",
17
  "promptExamples": [
18
  {
@@ -33,7 +34,6 @@ MODELS=`[
33
  "top_k": 50,
34
  "truncate": 1000,
35
  "max_new_tokens": 1024,
36
- "stop":["</s>"]
37
  }
38
  },
39
  {
@@ -61,7 +61,8 @@ MODELS=`[
61
  "top_p": 0.9,
62
  "repetition_penalty": 1.2,
63
  "truncate": 8000,
64
- "max_new_tokens": 2000
 
65
  }
66
  }
67
  ]`
 
13
  "websiteUrl": "https://open-assistant.io",
14
  "userMessageToken": "<|prompter|>",
15
  "assistantMessageToken": "<|assistant|>",
16
+ "messageEndToken": "</s>",
17
  "preprompt": "Below are a series of dialogues between various people and an AI assistant. The AI tries to be helpful, polite, honest, sophisticated, emotionally aware, and humble-but-knowledgeable. The assistant is happy to help with almost anything, and will do its best to understand exactly what is needed. It also tries to avoid giving false or misleading information, and it caveats when it isn't entirely sure about the right answer. That said, the assistant is practical and really does its best, and doesn't let caution get too much in the way of being useful.\n-----\n",
18
  "promptExamples": [
19
  {
 
34
  "top_k": 50,
35
  "truncate": 1000,
36
  "max_new_tokens": 1024,
 
37
  }
38
  },
39
  {
 
61
  "top_p": 0.9,
62
  "repetition_penalty": 1.2,
63
  "truncate": 8000,
64
+ "max_new_tokens": 2000,
65
+ "stop": ["Human:", "-----"]
66
  }
67
  }
68
  ]`
src/lib/buildPrompt.ts CHANGED
@@ -17,10 +17,10 @@ export function buildPrompt(
17
  (m.from === "user"
18
  ? model.userMessageToken + m.content
19
  : model.assistantMessageToken + m.content) +
20
- (model.parameters.stop
21
- ? m.content.endsWith(model.parameters.stop[0])
22
  ? ""
23
- : model.parameters.stop[0]
24
  : "")
25
  )
26
  .join("") + model.assistantMessageToken;
 
17
  (m.from === "user"
18
  ? model.userMessageToken + m.content
19
  : model.assistantMessageToken + m.content) +
20
+ (model.messageEndToken
21
+ ? m.content.endsWith(model.messageEndToken)
22
  ? ""
23
+ : model.messageEndToken
24
  : "")
25
  )
26
  .join("") + model.assistantMessageToken;
src/lib/components/chat/ChatMessage.svelte CHANGED
@@ -8,22 +8,32 @@
8
  import IconLoading from "../icons/IconLoading.svelte";
9
  import CarbonRotate360 from "~icons/carbon/rotate-360";
10
  import { PUBLIC_SEP_TOKEN } from "$lib/constants/publicSepToken";
 
11
 
12
  function sanitizeMd(md: string) {
13
- return md
14
  .replace(/<\|[a-z]*$/, "")
15
  .replace(/<\|[a-z]+\|$/, "")
16
  .replace(/<$/, "")
17
  .replaceAll(PUBLIC_SEP_TOKEN, " ")
18
  .replaceAll(/<\|[a-z]+\|>/g, " ")
19
  .replaceAll(/<br\s?\/?>/gi, "\n")
20
- .trim()
21
- .replaceAll("<", "&lt;");
 
 
 
 
 
 
 
 
22
  }
23
  function unsanitizeMd(md: string) {
24
  return md.replaceAll("&lt;", "<");
25
  }
26
 
 
27
  export let message: Message;
28
  export let loading = false;
29
 
 
8
  import IconLoading from "../icons/IconLoading.svelte";
9
  import CarbonRotate360 from "~icons/carbon/rotate-360";
10
  import { PUBLIC_SEP_TOKEN } from "$lib/constants/publicSepToken";
11
+ import type { Model } from "$lib/types/Model";
12
 
13
  function sanitizeMd(md: string) {
14
+ let ret = md
15
  .replace(/<\|[a-z]*$/, "")
16
  .replace(/<\|[a-z]+\|$/, "")
17
  .replace(/<$/, "")
18
  .replaceAll(PUBLIC_SEP_TOKEN, " ")
19
  .replaceAll(/<\|[a-z]+\|>/g, " ")
20
  .replaceAll(/<br\s?\/?>/gi, "\n")
21
+ .replaceAll("<", "&lt;")
22
+ .trim();
23
+
24
+ for (const stop of model.parameters.stop ?? []) {
25
+ if (ret.endsWith(stop)) {
26
+ ret = ret.slice(0, -stop.length).trim();
27
+ }
28
+ }
29
+
30
+ return ret;
31
  }
32
  function unsanitizeMd(md: string) {
33
  return md.replaceAll("&lt;", "<");
34
  }
35
 
36
+ export let model: Model;
37
  export let message: Message;
38
  export let loading = false;
39
 
src/lib/components/chat/ChatMessages.svelte CHANGED
@@ -42,6 +42,7 @@
42
  <ChatMessage
43
  loading={loading && i === messages.length - 1}
44
  {message}
 
45
  on:retry={() => dispatch("retry", { id: message.id, content: message.content })}
46
  />
47
  {:else}
@@ -50,7 +51,10 @@
50
  {/if}
51
  {/each}
52
  {#if pending}
53
- <ChatMessage message={{ from: "assistant", content: "", id: randomUUID() }} />
 
 
 
54
  {/if}
55
  <div class="h-32 flex-none" />
56
  </div>
 
42
  <ChatMessage
43
  loading={loading && i === messages.length - 1}
44
  {message}
45
+ model={currentModel}
46
  on:retry={() => dispatch("retry", { id: message.id, content: message.content })}
47
  />
48
  {:else}
 
51
  {/if}
52
  {/each}
53
  {#if pending}
54
+ <ChatMessage
55
+ message={{ from: "assistant", content: "", id: randomUUID() }}
56
+ model={currentModel}
57
+ />
58
  {/if}
59
  <div class="h-32 flex-none" />
60
  </div>
src/lib/server/models.ts CHANGED
@@ -10,6 +10,7 @@ const modelsRaw = z
10
  datasetName: z.string().min(1).optional(),
11
  userMessageToken: z.string().min(1),
12
  assistantMessageToken: z.string().min(1),
 
13
  preprompt: z.string().default(""),
14
  prepromptUrl: z.string().url().optional(),
15
  promptExamples: z
@@ -34,7 +35,7 @@ const modelsRaw = z
34
  temperature: z.number().min(0).max(1),
35
  truncate: z.number().int().positive(),
36
  max_new_tokens: z.number().int().positive(),
37
- stop: z.array(z.string()).min(1).optional(),
38
  })
39
  .passthrough(),
40
  })
 
10
  datasetName: z.string().min(1).optional(),
11
  userMessageToken: z.string().min(1),
12
  assistantMessageToken: z.string().min(1),
13
+ messageEndToken: z.string().min(1).optional(),
14
  preprompt: z.string().default(""),
15
  prepromptUrl: z.string().url().optional(),
16
  promptExamples: z
 
35
  temperature: z.number().min(0).max(1),
36
  truncate: z.number().int().positive(),
37
  max_new_tokens: z.number().int().positive(),
38
+ stop: z.array(z.string()).optional(),
39
  })
40
  .passthrough(),
41
  })
src/lib/types/Model.ts CHANGED
@@ -1,7 +1,6 @@
1
- export interface Model {
2
- name: string;
3
- displayName?: string;
4
- websiteUrl?: string;
5
- datasetName?: string;
6
- promptExamples?: Array<{ title: string; prompt: string }>;
7
- }
 
1
+ import type { BackendModel } from "$lib/server/models";
2
+
3
+ export type Model = Pick<
4
+ BackendModel,
5
+ "name" | "displayName" | "websiteUrl" | "datasetName" | "promptExamples" | "parameters"
6
+ >;
 
src/routes/+layout.server.ts CHANGED
@@ -33,8 +33,7 @@ export const load: LayoutServerLoad = async ({ locals, depends, url }) => {
33
  settings: {
34
  shareConversationsWithModelAuthors: settings?.shareConversationsWithModelAuthors ?? true,
35
  ethicsModalAcceptedAt: settings?.ethicsModalAcceptedAt ?? null,
36
- activeModel:
37
- url.searchParams.get("model") ?? settings?.activeModel ?? defaultModel.name,
38
  },
39
  models: models.map((model) => ({
40
  name: model.name,
 
33
  settings: {
34
  shareConversationsWithModelAuthors: settings?.shareConversationsWithModelAuthors ?? true,
35
  ethicsModalAcceptedAt: settings?.ethicsModalAcceptedAt ?? null,
36
+ activeModel: url.searchParams.get("model") ?? settings?.activeModel ?? defaultModel.name,
 
37
  },
38
  models: models.map((model) => ({
39
  name: model.name,
src/routes/conversation/[id]/+server.ts CHANGED
@@ -107,7 +107,16 @@ export async function POST({ request, fetch, locals, params }) {
107
  generated_text = generated_text.slice(prompt.length);
108
  }
109
 
110
- generated_text = trimSuffix(trimPrefix(generated_text, "<|startoftext|>"), PUBLIC_SEP_TOKEN);
 
 
 
 
 
 
 
 
 
111
 
112
  messages.push({ from: "assistant", content: generated_text, id: crypto.randomUUID() });
113
 
 
107
  generated_text = generated_text.slice(prompt.length);
108
  }
109
 
110
+ generated_text = trimSuffix(
111
+ trimPrefix(generated_text, "<|startoftext|>"),
112
+ PUBLIC_SEP_TOKEN
113
+ ).trim();
114
+
115
+ for (const stop of modelInfo?.parameters?.stop ?? []) {
116
+ if (generated_text.endsWith(stop)) {
117
+ generated_text = generated_text.slice(0, -stop.length).trim();
118
+ }
119
+ }
120
 
121
  messages.push({ from: "assistant", content: generated_text, id: crypto.randomUUID() });
122