Skip to content

Commit

Permalink
Fix the model id for Llama 3.1 405B now that it's finally on the hub
Browse files Browse the repository at this point in the history
  • Loading branch information
AlexCheema committed Jul 31, 2024
1 parent 178fb75 commit 94ac946
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion exo/api/chatgpt_api.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@
"MLXDynamicShardInferenceEngine": Shard(model_id="mlx-community/Meta-Llama-3.1-70B-Instruct-4bit", start_layer=0, end_layer=0, n_layers=80),
},
"llama-3.1-405b": {
- "MLXDynamicShardInferenceEngine": Shard(model_id="/Users/alex/405b-instruct-4bit", start_layer=0, end_layer=0, n_layers=126),
+ "MLXDynamicShardInferenceEngine": Shard(model_id="mlx-community/Meta-Llama-3.1-405B-4bit", start_layer=0, end_layer=0, n_layers=126),
},
"llama-3-8b": {
"MLXDynamicShardInferenceEngine": Shard(model_id="mlx-community/Meta-Llama-3-8B-Instruct-4bit", start_layer=0, end_layer=0, n_layers=32),
Expand Down

0 comments on commit 94ac946

Please sign in to comment.