Skip to content

Commit

Permalink
Add 4-bit MLX of Llama 3.3 model.
Browse files Browse the repository at this point in the history
  • Loading branch information
dadmobile committed Dec 12, 2024
1 parent 9f64e3e commit bb3f563
Showing 1 changed file with 27 additions and 0 deletions.
27 changes: 27 additions & 0 deletions transformerlab/galleries/model-gallery.json
Original file line number Diff line number Diff line change
Expand Up @@ -1264,6 +1264,33 @@
"paperUrl": "?"
}
},
{
"uniqueID": "mlx-community/Llama-3.3-70B-Instruct-4bit",
"name": "Llama-3.3-70B-Instruct-4bit",
"description": "MLX export of the Llama 3.3 70B Instruct model, quantized to 4 bits. Loses some quality but is useful for systems with less RAM.",
"parameters": "70B",
"context": "131072",
"architecture": "LlamaForCausalLM",
"formats": [
"Safetensors"
],
"huggingface_repo": "mlx-community/Llama-3.3-70B-Instruct-4bit",
"transformers_version": "4.47.0.dev0",
"gated": false,
"license": "llama3.3",
"logo": "https://upload.wikimedia.org/wikipedia/commons/a/ab/Meta-Logo.png",
"size_of_model_in_mb": 37866.6,
"author": {
"name": "mlx-community",
"url": "https://huggingface.co/mlx-community/Llama-3.3-70B-Instruct-4bit",
"blurb": ""
},
"resources": {
"canonicalUrl": "https://huggingface.co/mlx-community/Llama-3.3-70B-Instruct-4bit",
"downloadUrl": "https://huggingface.co/mlx-community/Llama-3.3-70B-Instruct-4bit",
"paperUrl": "?"
}
},
{
"uniqueID": "Qwen/Qwen2-7B-Instruct",
"name": "Qwen2 7B Instruct",
Expand Down

0 comments on commit bb3f563

Please sign in to comment.