Add Llama 3.1 (#98)
* Update Mistral 7B config * Add Mistral NeMo * Update for Llama 3.1 * Align LlamaConfiguration with Python implementation * Fix model configuration names * Refine DynamicNTKScalingRoPE * compute base only once --------- Co-authored-by: Awni Hannun <awni@apple.com>
This commit is contained in:
@@ -151,7 +151,7 @@ extension ModelConfiguration {
|
||||
defaultPrompt: "Why is the sky blue?"
|
||||
)
|
||||
|
||||
public static let phi34bit = ModelConfiguration(
|
||||
public static let phi3_4bit = ModelConfiguration(
|
||||
id: "mlx-community/Phi-3-mini-4k-instruct-4bit-no-q-embed",
|
||||
defaultPrompt: "what is the gravity on mars and the moon?",
|
||||
extraEOSTokens: ["<|end|>"]
|
||||
@@ -199,9 +199,17 @@ extension ModelConfiguration {
|
||||
"\(prompt)"
|
||||
}
|
||||
|
||||
public static let llama38B4bit = ModelConfiguration(
|
||||
public static let llama3_1_8B_4bit = ModelConfiguration(
|
||||
id: "mlx-community/Meta-Llama-3.1-8B-Instruct-4bit",
|
||||
defaultPrompt: "What is the difference between a fruit and a vegetable?"
|
||||
) {
|
||||
prompt in
|
||||
"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\nYou are a helpful assistant<|eot_id|>\n<|start_header_id|>user<|end_header_id|>\n\(prompt)<|eot_id|>\n<|start_header_id|>assistant<|end_header_id|>"
|
||||
}
|
||||
|
||||
public static let llama3_8B_4bit = ModelConfiguration(
|
||||
id: "mlx-community/Meta-Llama-3-8B-Instruct-4bit",
|
||||
defaultPrompt: "what is the difference between a fruit and a vegetable?"
|
||||
defaultPrompt: "What is the difference between a fruit and a vegetable?"
|
||||
) {
|
||||
prompt in
|
||||
"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\nYou are a helpful assistant<|eot_id|>\n<|start_header_id|>user<|end_header_id|>\n\(prompt)<|eot_id|>\n<|start_header_id|>assistant<|end_header_id|>"
|
||||
@@ -220,12 +228,13 @@ extension ModelConfiguration {
|
||||
case .idle:
|
||||
bootstrapState = .bootstrapping
|
||||
register(configurations: [
|
||||
llama3_1_8B_4bit,
|
||||
mistralNeMo4bit,
|
||||
smolLM_135M_4bit,
|
||||
mistral7B4bit,
|
||||
codeLlama13b4bit,
|
||||
phi4bit,
|
||||
phi34bit,
|
||||
phi3_4bit,
|
||||
gemma2bQuantized,
|
||||
gemma_2_9b_it_4bit,
|
||||
qwen205b4bit,
|
||||
|
||||
Reference in New Issue
Block a user