diff --git a/inference/models/CodeLlama-7b-hf.yaml b/inference/models/CodeLlama-7b-hf.yaml index c25733f99..57f85ff18 100644 --- a/inference/models/CodeLlama-7b-hf.yaml +++ b/inference/models/CodeLlama-7b-hf.yaml @@ -7,7 +7,7 @@ deepspeed: false workers_per_group: 2 device: "cpu" ipex: - enabled: true + enabled: false precision: bf16 model_description: model_id_or_path: codellama/CodeLlama-7b-hf diff --git a/inference/models/falcon-7b.yaml b/inference/models/falcon-7b.yaml index daf41b523..f4a8ad213 100644 --- a/inference/models/falcon-7b.yaml +++ b/inference/models/falcon-7b.yaml @@ -7,7 +7,7 @@ deepspeed: false workers_per_group: 2 device: "cpu" ipex: - enabled: true + enabled: false precision: bf16 model_description: model_id_or_path: tiiuae/falcon-7b