From 816ae7a53a00b881c9d8fc68efe2b60d5dd8b82d Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Wed, 25 Dec 2024 11:47:11 +0100 Subject: [PATCH 1/3] chore(model gallery): add fastllama-3.2-1b-instruct (#4493) Signed-off-by: Ettore Di Giacinto --- gallery/index.yaml | 15 +++++++++++++++ 1 file changed, 15 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index d1a055b36db2..78df4904a862 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -964,6 +964,21 @@ - filename: Llama-Chat-Summary-3.2-3B-Q4_K_M.gguf sha256: ed1be20d2374aa6db9940923f41fa229bd7ebe13d41b1ff1ff18a6f87e99df79 uri: huggingface://bartowski/Llama-Chat-Summary-3.2-3B-GGUF/Llama-Chat-Summary-3.2-3B-Q4_K_M.gguf +- !!merge <<: *llama32 + name: "fastllama-3.2-1b-instruct" + icon: https://huggingface.co/suayptalha/FastLlama-3.2-1B-Instruct/resolve/main/FastLlama.png + urls: + - https://huggingface.co/suayptalha/FastLlama-3.2-1B-Instruct + - https://huggingface.co/bartowski/FastLlama-3.2-1B-Instruct-GGUF + description: | + FastLlama is a highly optimized version of the Llama-3.2-1B-Instruct model. Designed for superior performance in constrained environments, it combines speed, compactness, and high accuracy. This version has been fine-tuned using the MetaMathQA-50k section of the HuggingFaceTB/smoltalk dataset to enhance its mathematical reasoning and problem-solving abilities. + overrides: + parameters: + model: FastLlama-3.2-1B-Instruct-Q4_K_M.gguf + files: + - filename: FastLlama-3.2-1B-Instruct-Q4_K_M.gguf + sha256: 3c0303e9560c441a9abdcd0e4c04c47e7f6b21277c1e8c00eed94fc656da0be9 + uri: huggingface://bartowski/FastLlama-3.2-1B-Instruct-GGUF/FastLlama-3.2-1B-Instruct-Q4_K_M.gguf - &qwen25 ## Qwen2.5 name: "qwen2.5-14b-instruct" From 8f6332ab23472b4591248a2717c263ea5b389482 Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Wed, 25 Dec 2024 11:47:22 +0100 Subject: [PATCH 2/3] chore(model gallery): add dans-personalityengine-v1.1.0-12b (#4494) Signed-off-by: Ettore Di Giacinto --- gallery/index.yaml | 15 +++++++++++++++ 1 file changed, 15 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index 78df4904a862..0eb95b7b96cd 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -5083,6 +5083,21 @@ - filename: NaturalLM-7B-Instruct-Q4_K_M.gguf sha256: 15b2f34116f690fea35790a9392b8a2190fe25827e370d426e88a2a543f4dcee uri: huggingface://bartowski/NaturalLM-7B-Instruct-GGUF/NaturalLM-7B-Instruct-Q4_K_M.gguf +- !!merge <<: *mistral03 + name: "dans-personalityengine-v1.1.0-12b" + url: "github:mudler/LocalAI/gallery/chatml.yaml@master" + urls: + - https://huggingface.co/PocketDoc/Dans-PersonalityEngine-V1.1.0-12b + - https://huggingface.co/bartowski/Dans-PersonalityEngine-V1.1.0-12b-GGUF + description: | + This model series is intended to be multifarious in its capabilities and should be quite capable at both co-writing and roleplay as well as find itself quite at home performing sentiment analysis or summarization as part of a pipeline. It has been trained on a wide array of one shot instructions, multi turn instructions, tool use, role playing scenarios, text adventure games, co-writing, and much more. + overrides: + parameters: + model: Dans-PersonalityEngine-V1.1.0-12b-Q4_K_M.gguf + files: + - filename: Dans-PersonalityEngine-V1.1.0-12b-Q4_K_M.gguf + sha256: a1afb9fddfa3f2847ed710cc374b4f17e63a75f7e10d8871cf83983c2f5415ab + uri: huggingface://bartowski/Dans-PersonalityEngine-V1.1.0-12b-GGUF/Dans-PersonalityEngine-V1.1.0-12b-Q4_K_M.gguf - &mudler ### START mudler's LocalAI specific-models url: "github:mudler/LocalAI/gallery/mudler.yaml@master" From 1a74af1492709173ed347cbde9ad53698b9922ac Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Wed, 25 Dec 2024 11:47:33 +0100 Subject: [PATCH 3/3] chore(model gallery): add llama-3.1-8b-open-sft (#4495) Signed-off-by: Ettore Di Giacinto --- gallery/index.yaml | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index 0eb95b7b96cd..2a765c37a7f5 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -4193,6 +4193,20 @@ - filename: orca_mini_v8_1_70b-Q4_K_M.gguf sha256: 97627730b028d4d7a349ae0b8e219207163ec425e4e1c057e445b2a66b61fdfa uri: huggingface://bartowski/orca_mini_v8_1_70b-GGUF/orca_mini_v8_1_70b-Q4_K_M.gguf +- !!merge <<: *llama31 + name: "llama-3.1-8b-open-sft" + urls: + - https://huggingface.co/prithivMLmods/Llama-3.1-8B-Open-SFT + - https://huggingface.co/bartowski/Llama-3.1-8B-Open-SFT-GGUF + description: | + The Llama-3.1-8B-Open-SFT model is a fine-tuned version of meta-llama/Llama-3.1-8B-Instruct, designed for advanced text generation tasks, including conversational interactions, question answering, and chain-of-thought reasoning. This model leverages Supervised Fine-Tuning (SFT) using the O1-OPEN/OpenO1-SFT dataset to provide enhanced performance in context-sensitive and instruction-following tasks. + overrides: + parameters: + model: Llama-3.1-8B-Open-SFT-Q4_K_M.gguf + files: + - filename: Llama-3.1-8B-Open-SFT-Q4_K_M.gguf + sha256: ce75152763c48c5386fe59652cc921aae456da36ab82af3d9e2080f603f45132 + uri: huggingface://bartowski/Llama-3.1-8B-Open-SFT-GGUF/Llama-3.1-8B-Open-SFT-Q4_K_M.gguf - &deepseek ## Deepseek url: "github:mudler/LocalAI/gallery/deepseek.yaml@master"