Text Generation
Transformers
Safetensors
GGUF
English
Inference Endpoints
leafspark committed on
Commit
ebad837
·
verified ·
1 Parent(s): 8cf2c37

Upload 2 files

Browse files
.gitattributes CHANGED
@@ -41,3 +41,4 @@ chk-wikichat-256x28-8590.gguf filter=lfs diff=lfs merge=lfs -text
41
  ggml-wikichat-256x28-f32-8590.gguf filter=lfs diff=lfs merge=lfs -text
42
  ggml-wikichat-256x28-f32-9580.gguf filter=lfs diff=lfs merge=lfs -text
43
  ggml-wikichat-256x28-f32-9590-4k.gguf filter=lfs diff=lfs merge=lfs -text
 
 
41
  ggml-wikichat-256x28-f32-8590.gguf filter=lfs diff=lfs merge=lfs -text
42
  ggml-wikichat-256x28-f32-9580.gguf filter=lfs diff=lfs merge=lfs -text
43
  ggml-wikichat-256x28-f32-9590-4k.gguf filter=lfs diff=lfs merge=lfs -text
44
+ chk-wikichat-256x28-9590-4k.gguf filter=lfs diff=lfs merge=lfs -text
chk-wikichat-256x28-9590-4k.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48e91edc878fa54b434c572e96f7a370e373f98f5105bee73a4704184b6abb68
3
+ size 483790912
model_config_4k.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "WikiGGML4k",
3
+ "load_params": {
4
+ "n_ctx": 4096,
5
+ "n_batch": 512,
6
+ "rope_freq_base": 0,
7
+ "rope_freq_scale": 0,
8
+ "n_gpu_layers": -1,
9
+ "use_mlock": true,
10
+ "main_gpu": 0,
11
+ "tensor_split": [
12
+ 0
13
+ ],
14
+ "seed": -1,
15
+ "f16_kv": true,
16
+ "use_mmap": true,
17
+ "no_kv_offload": false,
18
+ "num_experts_used": 0
19
+ },
20
+ "inference_params": {
21
+ "n_threads": 4,
22
+ "n_predict": -1,
23
+ "top_k": 40,
24
+ "min_p": 0.05,
25
+ "top_p": 0.95,
26
+ "temp": 0.8,
27
+ "repeat_penalty": 1.1,
28
+ "input_prefix": "User:",
29
+ "input_suffix": "\nA:",
30
+ "antiprompt": [
31
+ "### Instruction:",
32
+ "### User:\\n",
33
+ "User:\\n"
34
+ ],
35
+ "pre_prompt": "Below is an instruction that describes a task. Write a response that appropriately completes the request.",
36
+ "pre_prompt_suffix": "\\n",
37
+ "pre_prompt_prefix": "",
38
+ "seed": -1,
39
+ "tfs_z": 1,
40
+ "typical_p": 1,
41
+ "repeat_last_n": 64,
42
+ "frequency_penalty": 0,
43
+ "presence_penalty": 0,
44
+ "n_keep": 0,
45
+ "logit_bias": {},
46
+ "mirostat": 0,
47
+ "mirostat_tau": 5,
48
+ "mirostat_eta": 0.1,
49
+ "memory_f16": true,
50
+ "multiline_input": false,
51
+ "penalize_nl": true
52
+ }
53
+ }