diff --git a/aio/cpu/text-to-text.yaml b/aio/cpu/text-to-text.yaml index aeb3c842..d30f403e 100644 --- a/aio/cpu/text-to-text.yaml +++ b/aio/cpu/text-to-text.yaml @@ -41,6 +41,7 @@ f16: true stopwords: - <|im_end|> - +- "\n" usage: | curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{ "model": "gpt-4", diff --git a/aio/gpu-8g/text-to-text.yaml b/aio/gpu-8g/text-to-text.yaml index 1a67169b..1645a257 100644 --- a/aio/gpu-8g/text-to-text.yaml +++ b/aio/gpu-8g/text-to-text.yaml @@ -41,6 +41,7 @@ f16: true stopwords: - <|im_end|> - +- "\n" usage: | curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{ "model": "gpt-4", diff --git a/aio/intel/text-to-text.yaml b/aio/intel/text-to-text.yaml index 0577d19b..3f3d2c39 100644 --- a/aio/intel/text-to-text.yaml +++ b/aio/intel/text-to-text.yaml @@ -40,6 +40,7 @@ template: context_size: 4096 stopwords: - <|im_end|> +- "\n" - usage: | curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{ diff --git a/embedded/models/hermes-2-pro-mistral.yaml b/embedded/models/hermes-2-pro-mistral.yaml index 108216f5..3792be78 100644 --- a/embedded/models/hermes-2-pro-mistral.yaml +++ b/embedded/models/hermes-2-pro-mistral.yaml @@ -41,6 +41,7 @@ f16: true stopwords: - <|im_end|> - +- "\n" usage: | curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{ "model": "hermes-2-pro-mistral",