From e0ef9e2bb99900f29fb8d73f07e66b478542713c Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Thu, 16 May 2024 20:05:20 +0200 Subject: [PATCH] models(gallery): add yi 6/9b, sqlcoder, sfr-iterative-dpo (#2335) Signed-off-by: Ettore Di Giacinto --- gallery/chatml.yaml | 20 +++++++------- gallery/index.yaml | 63 +++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 72 insertions(+), 11 deletions(-) diff --git a/gallery/chatml.yaml b/gallery/chatml.yaml index e27fdab8bfb8..2d4effe8f553 100644 --- a/gallery/chatml.yaml +++ b/gallery/chatml.yaml @@ -6,18 +6,17 @@ config_file: | template: chat_message: | <|im_start|>{{ .RoleName }} - {{- if .FunctionCall }} + {{ if .FunctionCall -}} Function call: - {{- else if eq .RoleName "tool" }} + {{ else if eq .RoleName "tool" -}} Function response: - {{- end }} - {{- if .Content}} + {{ end -}} + {{ if .Content -}} {{.Content }} - {{- end }} - {{- if .FunctionCall}} + {{ end -}} + {{ if .FunctionCall -}} {{toJson .FunctionCall}} - {{- end }} - <|im_end|> + {{ end -}}<|im_end|> function: | <|im_start|>system You are a function calling AI model. You are provided with functions to execute. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. 
Here are the available tools: @@ -28,7 +27,6 @@ config_file: | <|im_end|> {{.Input -}} <|im_start|>assistant - chat: | {{.Input -}} <|im_start|>assistant @@ -37,5 +35,5 @@ config_file: | context_size: 4096 f16: true stopwords: - - <|im_end|> - - + - '<|im_end|>' + - '' diff --git a/gallery/index.yaml b/gallery/index.yaml index c43ce3b8aecb..ee84169e0065 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -613,6 +613,35 @@ - filename: v2-Llama-3-Lumimaid-8B-v0.1-OAS-Q4_K_M-imat.gguf sha256: b00b4cc2ea4e06db592e5f581171758387106626bcbf445c03a1cb7b424be881 uri: huggingface://Lewdiculous/Llama-3-Lumimaid-8B-v0.1-OAS-GGUF-IQ-Imatrix/v2-Llama-3-Lumimaid-8B-v0.1-OAS-Q4_K_M-imat.gguf +- !!merge <<: *llama3 + name: "llama-3-sqlcoder-8b" + urls: + - https://huggingface.co/defog/llama-3-sqlcoder-8b + - https://huggingface.co/upendrab/llama-3-sqlcoder-8b-Q4_K_M-GGUF + license: cc-by-sa-4.0 + description: | + A capable language model for text to SQL generation for Postgres, Redshift and Snowflake that is on-par with the most capable generalist frontier models. + overrides: + parameters: + model: llama-3-sqlcoder-8b.Q4_K_M.gguf + files: + - filename: llama-3-sqlcoder-8b.Q4_K_M.gguf + sha256: b22fc704bf1405846886d9619f3eb93c40587cd58d9bda53789a17997257e023 + uri: huggingface://upendrab/llama-3-sqlcoder-8b-Q4_K_M-GGUF/llama-3-sqlcoder-8b.Q4_K_M.gguf +- !!merge <<: *llama3 + name: "sfr-iterative-dpo-llama-3-8b-r" + urls: + - https://huggingface.co/bartowski/SFR-Iterative-DPO-LLaMA-3-8B-R-GGUF + license: cc-by-nc-nd-4.0 + description: | + SFR-Iterative-DPO-LLaMA-3-8B-R is an instruct model based on Llama 3 8B, released by Salesforce Research and trained with iterative DPO-based online RLHF. 
+ overrides: + parameters: + model: SFR-Iterative-DPO-LLaMA-3-8B-R-Q4_K_M.gguf + files: + - filename: SFR-Iterative-DPO-LLaMA-3-8B-R-Q4_K_M.gguf + sha256: 480703ff85af337e1db2a9d9a678a3ac8ca0802e366b14d9c59b81d3fc689da8 + uri: huggingface://bartowski/SFR-Iterative-DPO-LLaMA-3-8B-R-GGUF/SFR-Iterative-DPO-LLaMA-3-8B-R-Q4_K_M.gguf - !!merge <<: *llama3 name: "suzume-llama-3-8B-multilingual" urls: @@ -695,6 +724,40 @@ - filename: Llama-3-8B-Instruct-DPO-v0.3.Q4_K_M.gguf sha256: 694c55b5215d03e59626cd4292076eaf31610ef27ba04737166766baa75d889f uri: huggingface://MaziyarPanahi/Llama-3-8B-Instruct-DPO-v0.3-32k-GGUF/Llama-3-8B-Instruct-DPO-v0.3.Q4_K_M.gguf +- &yi-chat + url: "github:mudler/LocalAI/gallery/chatml.yaml@master" + icon: "https://raw.githubusercontent.com/01-ai/Yi/main/assets/img/Yi_logo_icon_light.svg" + name: "yi-1.5-9b-chat" + license: apache-2.0 + urls: + - https://huggingface.co/01-ai/Yi-1.5-9B-Chat + - https://huggingface.co/MaziyarPanahi/Yi-1.5-9B-Chat-GGUF + tags: + - llm + - gguf + - gpu + - cpu + - yi + overrides: + context_size: 4096 + parameters: + model: Yi-1.5-9B-Chat.Q4_K_M.gguf + files: + - filename: Yi-1.5-9B-Chat.Q4_K_M.gguf + sha256: bae824bdb0f3a333714bafffcbb64cf5cba7259902cd2f20a0fec6efbc6c1e5a + uri: huggingface://MaziyarPanahi/Yi-1.5-9B-Chat-GGUF/Yi-1.5-9B-Chat.Q4_K_M.gguf +- !!merge <<: *yi-chat + name: "yi-1.5-6b-chat" + urls: + - https://huggingface.co/01-ai/Yi-1.5-6B-Chat + - https://huggingface.co/MaziyarPanahi/Yi-1.5-6B-Chat-GGUF + overrides: + parameters: + model: Yi-1.5-6B-Chat.Q4_K_M.gguf + files: + - filename: Yi-1.5-6B-Chat.Q4_K_M.gguf + sha256: 7a0f853dbd8d38bad71ada1933fd067f45f928b2cd978aba1dfd7d5dec2953db + uri: huggingface://MaziyarPanahi/Yi-1.5-6B-Chat-GGUF/Yi-1.5-6B-Chat.Q4_K_M.gguf - &vicuna-chat ## LLama2 and derivatives ### Start Fimbulvetr