@@ -1,4 +1,156 @@
 {
+    "yi-1.5": {
+        "brief": "Yi 1.5 is a high-performing, bilingual language model.",
+        "default": "6b",
+        "license": "Apache License Version 2.0",
+        "variants": {
+            "6b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 6441564880,
+                        "url": "chatllm_quantized_yi1.5/yi1.5-6b.bin"
+                    }
+                }
+            },
+            "9b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 9383354064,
+                        "url": "chatllm_quantized_yi1.5/yi1.5-9b.bin"
+                    }
+                }
+            },
+            "9b-16k": {
+                "default": "q4_1",
+                "quantized": {
+                    "q4_1": {
+                        "size": 5520662224,
+                        "url": "chatllm_quantized_yi1.5/yi1.5-9b-16k_q4_1.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-v2": {
+        "brief": "A strong, economical, and efficient Mixture-of-Experts language model.",
+        "default": "light",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "light": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 16691737872,
+                        "url": "chatllm_quantized_deepseek/deepseekv2-lite.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-coder-v2": {
+        "brief": "An open-source Mixture-of-Experts code language model that achieves performance comparable to GPT4-Turbo in code-specific tasks.",
+        "default": "light",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "light": {
+                "default": "q4_1",
+                "quantized": {
+                    "q8": {
+                        "size": 16691738304,
+                        "url": "chatllm_quantized_deepseek/deepseek-coder-v2-lite-instruct.bin"
+                    },
+                    "q4_1": {
+                        "size": 9820206784,
+                        "url": "chatllm_quantized_deepseek/deepseek-coder-v2-lite-instruct_q4_1.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-coder-v2-base": {
+        "brief": "An open-source Mixture-of-Experts code language model that achieves performance comparable to GPT4-Turbo in code-specific tasks.",
+        "default": "light",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "light": {
+                "default": "q4_1",
+                "quantized": {
+                    "q4_1": {
+                        "size": 9820206784,
+                        "url": "chatllm_quantized_deepseek/deepseek-coder-v2-lite-base_q4_1.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-llm": {
+        "brief": "An advanced language model crafted with 2 trillion bilingual tokens.",
+        "default": "7b",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "7b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 7345830176,
+                        "url": "chatllm_quantized_deepseek/deepseek-7b.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-coder": {
+        "brief": "DeepSeek Coder is a capable coding model trained on two trillion code and natural language tokens.",
+        "default": "1.3b",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "1.3b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 1431733904,
+                        "url": "chatllm_quantized_deepseek/deepseekcoder-1.3b.bin"
+                    }
+                }
+            },
+            "7b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 7163394192,
+                        "url": "chatllm_quantized_deepseek/deepseekcoder-7b.bin"
+                    }
+                }
+            }
+        }
+    },
+    "deepseek-coder-base": {
+        "brief": "DeepSeek Coder is a capable coding model trained on two trillion code and natural language tokens.",
+        "default": "1.3b",
+        "license": "DEEPSEEK LICENSE AGREEMENT Version 1.0, 23 October 2023",
+        "variants": {
+            "1.3b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 1431733904,
+                        "url": "chatllm_quantized_deepseek/deepseekcoder-1.3b-base.bin"
+                    }
+                }
+            },
+            "6.7b": {
+                "default": "q8",
+                "quantized": {
+                    "q8": {
+                        "size": 7163394192,
+                        "url": "chatllm_quantized_deepseek/deepseekcoder-6.7b-base.bin"
+                    }
+                }
+            }
+        }
+    },
     "gemma": {
         "brief": "Gemma is a family of lightweight, state-of-the-art open models built by Google DeepMind. Updated to version 1.1.",
         "default": "2b",
@@ -25,7 +177,27 @@
                 "quantized": {
                     "q4_1": {
                         "size": 5025629392,
-                        "url": "chatllm_quantized_models/llama3-8b-q4_1.bin"
+                        "url": "chatllm_quantized_llama3/llama3-8b-q4_1.bin"
+                    },
+                    "q8": {
+                        "size": 8538752208,
+                        "url": "chatllm_quantized_llama3/llama3-8b.bin"
+                    }
+                }
+            }
+        }
+    },
+    "llama3-chinese-lora": {
+        "brief": "Llama-3-Chinese-8B-Instruct-LoRA is further tuned with 5M instruction data on Llama-3-Chinese-8B.",
+        "default": "8b",
+        "license": "",
+        "variants": {
+            "8b": {
+                "default": "q4_0",
+                "quantized": {
+                    "q4_0": {
+                        "size": 4523754704,
+                        "url": "chatllm_quantized_llama3/llama3-8b-lora-q4_0.bin"
                     }
                 }
             }
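
Each entry in this catalog follows the same shape: a model key carries a top-level "default" variant, each variant carries a "default" quantization, and each quantization records its payload "size" in bytes plus a repository-relative "url". Below is a minimal sketch of how a client might resolve those cascading defaults to a concrete download; the file name, BASE_URL, and resolve helper are illustrative assumptions, not part of this file.

    import json

    # Hypothetical mirror prefix: the catalog stores only relative paths,
    # so the real host must come from the downloader's own configuration.
    BASE_URL = "https://example.com/"

    def resolve(catalog, model, variant=None, quant=None):
        """Walk model -> variant -> quantization, falling back to the
        "default" recorded at each level when the caller leaves one unset."""
        entry = catalog[model]
        var = entry["variants"][variant or entry["default"]]
        q = var["quantized"][quant or var["default"]]
        return BASE_URL + q["url"], q["size"]

    with open("models.json") as f:  # assumed local copy of the catalog above
        catalog = json.load(f)

    url, size = resolve(catalog, "deepseek-coder-v2")  # defaults: light / q4_1
    url, size = resolve(catalog, "yi-1.5", "9b-16k")   # explicit variant, default q4_1

The "size" field also gives the client a cheap integrity check: a downloaded file whose byte count differs from the catalog value was truncated or corrupted and should be re-fetched.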