From de371b708d5f1c3923812f4838581e0f81439436 Mon Sep 17 00:00:00 2001 From: younesbelkada Date: Wed, 14 May 2025 17:07:05 +0400 Subject: [PATCH 1/4] add falcon-e support --- setup_env.py | 8 +++++++- utils/convert-hf-to-gguf-bitnet.py | 3 +++ 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/setup_env.py b/setup_env.py index dfad6c3e7..2544c5110 100644 --- a/setup_env.py +++ b/setup_env.py @@ -44,6 +44,12 @@ "microsoft/BitNet-b1.58-2B-4T": { "model_name": "BitNet-b1.58-2B-4T", }, + "tiiuae/Falcon-E-3B-Instruct": { + "model_name": "Falcon-E-3B-Instruct", + }, + "tiiuae/Falcon-E-1B-Instruct": { + "model_name": "Falcon-E-1B-Instruct", + }, } SUPPORTED_QUANT_TYPES = { @@ -144,7 +150,7 @@ def setup_gguf(): def gen_code(): _, arch = system_info() - llama3_f3_models = set([model['model_name'] for model in SUPPORTED_HF_MODELS.values() if model['model_name'].startswith("Falcon3") or model['model_name'].startswith("Llama")]) + llama3_f3_models = set([model['model_name'] for model in SUPPORTED_HF_MODELS.values() if model['model_name'].startswith("Falcon") or model['model_name'].startswith("Llama")]) if arch == "arm64": if args.use_pretuned: diff --git a/utils/convert-hf-to-gguf-bitnet.py b/utils/convert-hf-to-gguf-bitnet.py index f525f58f8..23e84384c 100644 --- a/utils/convert-hf-to-gguf-bitnet.py +++ b/utils/convert-hf-to-gguf-bitnet.py @@ -319,6 +319,9 @@ def get_vocab_base_pre(self, tokenizer) -> str: if chkhsh == "8aeee3860c56296a157a1fe2fad249ec40aa59b1bb5709f4ade11c4e6fe652ed": # ref: https://huggingface.co/tiiuae/falcon-7b res = "falcon" + if chkhsh == "a6b57017d60e6edb4d88ecc2845188e0eb333a70357e45dcc9b53964a73bbae6": + # ref: https://huggingface.co/tiiuae/Falcon-E-3B-Instruct + res = "falcon_e" if chkhsh == "0876d13b50744004aa9aeae05e7b0647eac9d801b5ba4668afc01e709c15e19f": # ref: https://huggingface.co/BAAI/bge-small-en-v1.5 res = "bert-bge" From 0015ad520190ccad48302a517e924b59be7dbc1e Mon Sep 17 00:00:00 2001 From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com> Date: Thu, 15 May 2025 18:49:28 +0400 Subject: [PATCH 2/4] Update README.md --- README.md | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/README.md b/README.md index 4af4626b6..fbd9a42a8 100644 --- a/README.md +++ b/README.md @@ -136,6 +136,20 @@ This project is based on the [llama.cpp](https://github.com/ggerganov/llama.cpp) ✅ ❌ + + Falcon-E Family + 1B-3B + x86 + ✅ + ❌ + ✅ + + + ARM + ✅ + ✅ + ❌ + From f314d18863ccb58ce37b02d2f922ac9ed5178f5f Mon Sep 17 00:00:00 2001 From: Younes Belkada <49240599+younesbelkada@users.noreply.github.com> Date: Wed, 21 May 2025 04:11:07 +0400 Subject: [PATCH 3/4] feat: add also base models --- setup_env.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/setup_env.py b/setup_env.py index 2544c5110..f15d65f43 100644 --- a/setup_env.py +++ b/setup_env.py @@ -50,6 +50,12 @@ "tiiuae/Falcon-E-1B-Instruct": { "model_name": "Falcon-E-1B-Instruct", }, + "tiiuae/Falcon-E-3B-Base": { + "model_name": "Falcon-E-3B-Base", + }, + "tiiuae/Falcon-E-1B-Base": { + "model_name": "Falcon-E-1B-Base", + }, } SUPPORTED_QUANT_TYPES = { From 765741d80bda4d3069e367bf0062134891232cce Mon Sep 17 00:00:00 2001 From: younesbelkada Date: Wed, 21 May 2025 11:52:30 +0400 Subject: [PATCH 4/4] update submodule --- 3rdparty/llama.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/3rdparty/llama.cpp b/3rdparty/llama.cpp index 5eb47b721..40ed0f290 160000 --- a/3rdparty/llama.cpp +++ b/3rdparty/llama.cpp @@ -1 +1 @@ -Subproject commit 5eb47b72106e3b35f10e8befa616a9241242b226 +Subproject commit 40ed0f290203a9a78540b8f7eb18bd828043fe21