Skip to content

Commit e97d1bc

Browse files
author
Judd
committed
more quantized models
1 parent d4a624c commit e97d1bc

File tree

1 file changed

+82
-0
lines changed

1 file changed

+82
-0
lines changed

scripts/models.json

Lines changed: 82 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,86 @@
11
{
2+
"glm-4": {
3+
"brief": "GLM-4-9B is the open-source version of the latest generation of pre-trained models in the GLM-4 series launched by Zhipu AI.",
4+
"default": "9b",
5+
"license": "https://huggingface.co/THUDM/glm-4-9b/blob/main/LICENSE",
6+
"variants": {
7+
"9b": {
8+
"default": "q8",
9+
"quantized": {
10+
"q8": {
11+
"size": 9993306576,
12+
"url": "chatllm_quantized_glm/glm4.bin"
13+
}
14+
}
15+
}
16+
}
17+
},
18+
"chatglm3": {
19+
"brief": "ChatGLM3 is a generation of pre-trained dialogue models jointly released by Zhipu AI and Tsinghua KEG.",
20+
"default": "6b",
21+
"license": "https://github.com/THUDM/ChatGLM3/blob/main/MODEL_LICENSE",
22+
"variants": {
23+
"6b": {
24+
"default": "q8",
25+
"quantized": {
26+
"q8": {
27+
"size": 6635798992,
28+
"url": "chatllm_quantized_glm/chatglm3-6b.bin"
29+
}
30+
}
31+
}
32+
}
33+
},
34+
"chatglm2": {
35+
"brief": "ChatGLM2-6B is the second-generation version of the open-source bilingual (Chinese-English) chat model ChatGLM-6B.",
36+
"default": "6b",
37+
"license": "https://github.com/THUDM/ChatGLM2-6B/blob/main/MODEL_LICENSE",
38+
"variants": {
39+
"6b": {
40+
"default": "q8",
41+
"quantized": {
42+
"q8": {
43+
"size": 6635798992,
44+
"url": "chatllm_quantized_glm/chatglm2.bin"
45+
}
46+
}
47+
}
48+
}
49+
},
50+
"phi3": {
51+
"brief": "Phi-3 is a family of lightweight 3B (Mini) and 14B (Medium) state-of-the-art open models by Microsoft.",
52+
"default": "mini-4k",
53+
"license": "MIT",
54+
"variants": {
55+
"mini-4k": {
56+
"default": "q8",
57+
"quantized": {
58+
"q8": {
59+
"size": 4060935568,
60+
"url": "chatllm_quantized_phi3/phi3-mini-4k.bin"
61+
}
62+
}
63+
},
64+
"mini-128k": {
65+
"default": "q8",
66+
"quantized": {
67+
"q8": {
68+
"size": 4060936592,
69+
"url": "chatllm_quantized_phi3/phi3-mini-128k.bin"
70+
}
71+
}
72+
},
73+
"medium-128k": {
74+
"default": "q4_1",
75+
"quantized": {
76+
"q4_1": {
77+
"size": 8727005584,
78+
"url": "chatllm_quantized_phi3/phi3-medium-128k_q4_1.bin"
79+
}
80+
}
81+
}
82+
}
83+
},
284
"yi-1.5": {
385
"brief": "Yi 1.5 is a high-performing, bilingual language model.",
486
"default": "6b",

0 commit comments

Comments
 (0)