From f6ea6bf54d162fb01c1be7f4dd66542b82ad9854 Mon Sep 17 00:00:00 2001 From: Justine Tunney Date: Thu, 28 Dec 2023 02:09:19 -0800 Subject: [PATCH] Release llamafile v0.4.1 --- .gitattributes | 2 -- README.md | 4 ++-- llamafile/cuda.bat | 2 -- llamafile/version.h | 2 +- 4 files changed, 3 insertions(+), 7 deletions(-) delete mode 100644 .gitattributes diff --git a/.gitattributes b/.gitattributes deleted file mode 100644 index c44c4567fe..0000000000 --- a/.gitattributes +++ /dev/null @@ -1,2 +0,0 @@ -# -*- conf -*- -*.dll binary diff --git a/README.md b/README.md index db20f9454b..9d0e3dd625 100644 --- a/README.md +++ b/README.md @@ -152,7 +152,7 @@ enable you to work around Windows' 4GB executable file size limit. For Windows users, here's an example for the Mistral LLM: ```sh -curl -L -o llamafile.exe https://github.com/Mozilla-Ocho/llamafile/releases/download/0.4/llamafile-server-0.4 +curl -L -o llamafile.exe https://github.com/Mozilla-Ocho/llamafile/releases/download/0.4.1/llamafile-server-0.4.1 curl -L -o mistral.gguf https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf .\llamafile.exe -m mistral.gguf ``` @@ -160,7 +160,7 @@ curl -L -o mistral.gguf https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1 Here's the same example, but for macOS, Linux, and BSD users: ```sh -curl -L https://github.com/Mozilla-Ocho/llamafile/releases/download/0.4/llamafile-server-0.4 >llamafile +curl -L https://github.com/Mozilla-Ocho/llamafile/releases/download/0.4.1/llamafile-server-0.4.1 >llamafile curl -L https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf >mistral.gguf chmod +x llamafile ./llamafile -m mistral.gguf diff --git a/llamafile/cuda.bat b/llamafile/cuda.bat index dce3159917..55d8c38c89 100644 --- a/llamafile/cuda.bat +++ b/llamafile/cuda.bat @@ -1,5 +1,3 @@ -call "C:\Program Files\Microsoft Visual Studio\2022\Community\VC\Auxiliary\Build\vcvars64.bat" - nvcc -arch=all ^ --shared ^ --forward-unknown-to-host-compiler ^ diff --git a/llamafile/version.h b/llamafile/version.h index 6083fae688..468de84381 100644 --- a/llamafile/version.h +++ b/llamafile/version.h @@ -2,7 +2,7 @@ #define LLAMAFILE_MAJOR 0 #define LLAMAFILE_MINOR 4 -#define LLAMAFILE_PATCH 0 +#define LLAMAFILE_PATCH 1 #define LLAMAFILE_VERSION (100000000 * LLAMAFILE_MAJOR + 1000000 * LLAMAFILE_MINOR + LLAMAFILE_PATCH) #define MKVERSION__(x, y, z) #x "." #y "." #z