cortexso
/

mixtral

Inference Endpoints

Model card | Files and versions | Community

default

#1

by van-qa - opened Jul 17, 2024

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

Files changed (2) hide show

metadata.yml +0 -4
model.yml +1 -1

metadata.yml DELETED Viewed

@@ -1,4 +0,0 @@
-# metadata.yml
-version: 1
-name: mixtral
-default: 7x8b-gguf

model.yml CHANGED Viewed

@@ -15,5 +15,5 @@ stream: true # true | false
 # Engine / Model Settings
 ngl: 33 # Infer from base config.json -> num_attention_heads
 ctx_len: 32768 # Infer from base config.json -> max_position_embeddings
-engine: llama-cpp
 prompt_template: "[INST] {prompt} [/INST]"

 # Engine / Model Settings
 ngl: 33 # Infer from base config.json -> num_attention_heads
 ctx_len: 32768 # Infer from base config.json -> max_position_embeddings
+engine: cortex.llamacpp
 prompt_template: "[INST] {prompt} [/INST]"