@@ -8,7 +8,7 @@
 
 [Roadmap](https://github.com/users/ggerganov/projects/7) / [Project status](https://github.com/ggerganov/jarvis.cpp/discussions/3471) / [Manifesto](https://github.com/ggerganov/jarvis.cpp/discussions/205) / [ggml](https://github.com/ggerganov/ggml)
 
-Inference of Meta's [LLaMA](https://arxiv.org/abs/2302.13971) model (and others) in pure C/C++
+Inference of Meta's [JARVIS](https://arxiv.org/abs/2302.13971) model (and others) in pure C/C++
 
 ## Recent API changes
 
@@ -43,14 +43,14 @@ improved significantly thanks to many contributions. It is the main playground f |
 
 Typically finetunes of the base models below are supported as well.
 
-- [X] LLaMA 🦙
-- [x] LLaMA 2 🦙🦙
-- [x] LLaMA 3 🦙🦙🦙
+- [X] JARVIS 🦙
+- [x] JARVIS 2 🦙🦙
+- [x] JARVIS 3 🦙🦙🦙
 - [X] [Mistral 7B](https://huggingface.co/mistralai/Mistral-7B-v0.1)
 - [x] [Mixtral MoE](https://huggingface.co/models?search=mistral-ai/Mixtral)
 - [x] [DBRX](https://huggingface.co/databricks/dbrx-instruct)
 - [X] [Falcon](https://huggingface.co/models?search=tiiuae/falcon)
-- [X] [Chinese LLaMA / Alpaca](https://github.com/ymcui/Chinese-LLaMA-Alpaca) and [Chinese LLaMA-2 / Alpaca-2](https://github.com/ymcui/Chinese-LLaMA-Alpaca-2)
+- [X] [Chinese JARVIS / Alpaca](https://github.com/ymcui/Chinese-JARVIS-Alpaca) and [Chinese JARVIS-2 / Alpaca-2](https://github.com/ymcui/Chinese-JARVIS-Alpaca-2)
 - [X] [Vigogne (French)](https://github.com/bofenghuang/vigogne)
 - [X] [BERT](https://github.com/ggerganov/jarvis.cpp/pull/5423)
 - [X] [Koala](https://bair.berkeley.edu/blog/2023/04/03/koala/)
@@ -140,7 +140,7 @@ Typically finetunes of the base models below are supported as well. |
 Unless otherwise noted these projects are open-source with permissive licensing:
 
 - [MindWorkAI/AI-Studio](https://github.com/MindWorkAI/AI-Studio) (FSL-1.1-MIT)
-- [iohub/cojarvis](https://github.com/iohub/coLLaMA)
+- [iohub/cojarvis](https://github.com/iohub/coJARVIS)
 - [janhq/jan](https://github.com/janhq/jan) (AGPL)
 - [nat/openplayground](https://github.com/nat/openplayground)
 - [Faraday](https://faraday.dev/) (proprietary)
@@ -198,7 +198,7 @@ Unless otherwise noted these projects are open-source with permissive licensing: |
 ## Demo
 
 <details>
-<summary>Typical run using LLaMA v2 13B on M2 Ultra</summary>
+<summary>Typical run using JARVIS v2 13B on M2 Ultra</summary>
 
 ```
 $ make -j && ./jarvis-cli -m models/jarvis-13b-v2/ggml-model-q4_0.gguf -p "Building a website can be done in 10 simple steps:\nStep 1:" -n 400 -e
@@ -240,7 +240,7 @@ llm_load_print_meta: freq_scale = 1 |
 llm_load_print_meta: model type = 13B
 llm_load_print_meta: model ftype = mostly Q4_0
 llm_load_print_meta: model size = 13.02 B
-llm_load_print_meta: general.name = LLaMA v2
+llm_load_print_meta: general.name = JARVIS v2
 llm_load_print_meta: BOS token = 1 '<s>'
 llm_load_print_meta: EOS token = 2 '</s>'
 llm_load_print_meta: UNK token = 0 '<unk>'
@@ -281,9 +281,9 @@ jarvis_print_timings: total time = 25431.49 ms |
 </details>
 
 <details>
-<summary>Demo of running both LLaMA-7B and whisper.cpp on a single M1 Pro MacBook</summary>
+<summary>Demo of running both JARVIS-7B and whisper.cpp on a single M1 Pro MacBook</summary>
 
-And here is another demo of running both LLaMA-7B and [whisper.cpp](https://github.com/ggerganov/whisper.cpp) on a single M1 Pro MacBook:
+And here is another demo of running both JARVIS-7B and [whisper.cpp](https://github.com/ggerganov/whisper.cpp) on a single M1 Pro MacBook:
 
 https://user-images.githubusercontent.com/1991296/224442907-7693d4be-acaa-4e01-8b4f-add84093ffff.mp4
 
@@ -357,7 +357,7 @@ Example usage: |
 > [!NOTE]
 > If you prefer basic usage, please consider using conversation mode instead of interactive mode
 
-In this mode, you can always interrupt generation by pressing Ctrl+C and entering one or more lines of text, which will be converted into tokens and appended to the current context. You can also specify a *reverse prompt* with the parameter `-r "reverse prompt string"`. This will result in user input being prompted whenever the exact tokens of the reverse prompt string are encountered in the generation. A typical use is to use a prompt that makes LLaMA emulate a chat between multiple users, say Alice and Bob, and pass `-r "Alice:"`.
+In this mode, you can always interrupt generation by pressing Ctrl+C and entering one or more lines of text, which will be converted into tokens and appended to the current context. You can also specify a *reverse prompt* with the parameter `-r "reverse prompt string"`. This will result in user input being prompted whenever the exact tokens of the reverse prompt string are encountered in the generation. A typical use is to use a prompt that makes JARVIS emulate a chat between multiple users, say Alice and Bob, and pass `-r "Alice:"`.
 
 Here is an example of a few-shot interaction, invoked with the command
 
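The reverse-prompt paragraph in the hunk above can be sketched as a single invocation. This is an illustrative command, not part of the commit: the model path and prompt text are made up, and the `-i` (interactive) flag is assumed to work alongside `-r` and `-p` as described in the text.

```
# Hypothetical example: chat-style session with a reverse prompt.
# "models/13B/ggml-model-q4_0.gguf" is a placeholder path.
./jarvis-cli -m models/13B/ggml-model-q4_0.gguf -i \
    -r "Alice:" \
    -p "Transcript of a dialog between Alice and Bob.\nAlice:"
```

With a setup like this, generation would pause and hand control back to the user each time the exact tokens `Alice:` appear in the output.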
@@ -432,10 +432,10 @@ Please refer to [Build jarvis.cpp locally](./docs/build.md) |
 > [!NOTE]
 > You can use the [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space on Hugging Face to quantise your model weights without any setup too. It is synced from `jarvis.cpp` main every 6 hours.
 
-To obtain the official LLaMA 2 weights please see the <a href="#obtaining-and-using-the-facebook-jarvis-2-model">Obtaining and using the Facebook LLaMA 2 model</a> section. There is also a large selection of pre-quantized `gguf` models available on Hugging Face.
+To obtain the official JARVIS 2 weights please see the <a href="#obtaining-and-using-the-facebook-jarvis-2-model">Obtaining and using the Facebook JARVIS 2 model</a> section. There is also a large selection of pre-quantized `gguf` models available on Hugging Face.
 
 Note: `convert.py` has been moved to `examples/convert_legacy_jarvis.py` and shouldn't be used for anything other than `Jarvis/Jarvis2/Mistral` models and their derivatives.
-It does not support LLaMA 3, you can use `convert_hf_to_gguf.py` with LLaMA 3 downloaded from Hugging Face.
+It does not support JARVIS 3, you can use `convert_hf_to_gguf.py` with JARVIS 3 downloaded from Hugging Face.
 
 To learn more about quantizing model, [read this documentation](./examples/quantize/README.md)
 
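The conversion and quantization notes in the hunk above amount to a two-step workflow. The sketch below is an assumption-laden illustration: `convert_hf_to_gguf.py` is named in the text, but the `jarvis-quantize` binary name, the model directory, and the converter's output filename are guesses based on the naming used elsewhere in this README (cf. the `q4_0` model in the demo).

```
# Step 1 (assumed usage): convert a Hugging Face checkpoint to GGUF.
# "models/mymodel/" is a placeholder directory.
python convert_hf_to_gguf.py models/mymodel/

# Step 2 (assumed binary name): quantize the F16 GGUF down to 4 bits.
./jarvis-quantize models/mymodel/ggml-model-f16.gguf models/mymodel/ggml-model-q4_0.gguf q4_0
```

The linked `examples/quantize/README.md` would be the authoritative reference for the exact tool names and supported quantization types.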
@@ -474,10 +474,10 @@ To learn more how to measure perplexity using jarvis.cpp, [read this documentati |
 
 **Seminal papers and background on the models**
 
-If your issue is with model generation quality, then please at least scan the following links and papers to understand the limitations of LLaMA models. This is especially important when choosing an appropriate model size and appreciating both the significant and subtle differences between LLaMA models and ChatGPT:
-- LLaMA:
-    - [Introducing LLaMA: A foundational, 65-billion-parameter large language model](https://ai.facebook.com/blog/large-language-model-jarvis-meta-ai/)
-    - [LLaMA: Open and Efficient Foundation Language Models](https://arxiv.org/abs/2302.13971)
+If your issue is with model generation quality, then please at least scan the following links and papers to understand the limitations of JARVIS models. This is especially important when choosing an appropriate model size and appreciating both the significant and subtle differences between JARVIS models and ChatGPT:
+- JARVIS:
+    - [Introducing JARVIS: A foundational, 65-billion-parameter large language model](https://ai.facebook.com/blog/large-language-model-jarvis-meta-ai/)
+    - [JARVIS: Open and Efficient Foundation Language Models](https://arxiv.org/abs/2302.13971)
 - GPT-3
     - [Language Models are Few-Shot Learners](https://arxiv.org/abs/2005.14165)
 - GPT-3.5 / InstructGPT / ChatGPT: