Skip to content

Commit

Permalink
[Model] Add gemma-2-2b-jpn-it (#594)
Browse files Browse the repository at this point in the history
Add the following models to the list of prebuilt model IDs:
- `gemma-2-2b-jpn-it-q4f16_1-MLC`
- `gemma-2-2b-jpn-it-q4f32_1-MLC`

See mlc-ai/binary-mlc-llm-libs#143.
  • Loading branch information
CharlieFRuan authored Oct 4, 2024
1 parent 4d8f63a commit b1160e3
Showing 1 changed file with 28 additions and 0 deletions.
28 changes: 28 additions & 0 deletions src/config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -963,6 +963,34 @@ export const prebuiltAppConfig: AppConfig = {
context_window_size: 4096,
},
},
// Gemma2-2b-jpn
{
model: "https://huggingface.co/mlc-ai/gemma-2-2b-jpn-it-q4f16_1-MLC",
model_id: "gemma-2-2b-jpn-it-q4f16_1-MLC",
model_lib:
modelLibURLPrefix +
modelVersion +
"/gemma-2-2b-jpn-it-q4f16_1-ctx4k_cs1k-webgpu.wasm",
vram_required_MB: 1895.3,
low_resource_required: true,
required_features: ["shader-f16"],
overrides: {
context_window_size: 4096,
},
},
{
model: "https://huggingface.co/mlc-ai/gemma-2-2b-jpn-it-q4f32_1-MLC",
model_id: "gemma-2-2b-jpn-it-q4f32_1-MLC",
model_lib:
modelLibURLPrefix +
modelVersion +
"/gemma-2-2b-jpn-it-q4f32_1-ctx4k_cs1k-webgpu.wasm",
vram_required_MB: 2508.75,
low_resource_required: true,
overrides: {
context_window_size: 4096,
},
},
// Qwen-2
{
model: "https://huggingface.co/mlc-ai/Qwen2.5-0.5B-Instruct-q4f16_1-MLC",
Expand Down

0 comments on commit b1160e3

Please sign in to comment.