forked from ggerganov/llama.cpp
-
Notifications
You must be signed in to change notification settings - Fork 386
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
integrated libopenblas for greatly accelerated prompt processing. Win…
…dows binaries are included - feel free to build your own or to build for other platforms, but that is beyond the scope of this repo. Will fall back to non-blas if libopenblas is removed.
- Loading branch information
Showing
12 changed files
with
625 additions
and
16 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -34,4 +34,4 @@ __pycache__ | |
.swiftpm | ||
|
||
dist/ | ||
llama_for_kobold.spec | ||
*.spec |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Binary file not shown.
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Binary file not shown.
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1 +1 @@ | ||
pyinstaller --noconfirm --onefile --console --icon "./niko.ico" --add-data "./klite.embd;." --add-data "./llamacpp.dll;." "./llama_for_kobold.py" | ||
pyinstaller --noconfirm --onefile --console --icon "./niko.ico" --add-data "./klite.embd;." --add-data "./llamacpp.dll;." --add-data "./llamacpp_blas.dll;." --add-data "./libopenblas.dll;." "./llama_for_kobold.py" -n "llamacpp-for-kobold.exe" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,133 @@ | ||
#ifndef OPENBLAS_CONFIG_H | ||
#define OPENBLAS_CONFIG_H | ||
#define OPENBLAS_OS_WINNT 1 | ||
#define OPENBLAS_ARCH_X86_64 1 | ||
#define OPENBLAS_C_GCC 1 | ||
#define OPENBLAS___64BIT__ 1 | ||
#define OPENBLAS_HAVE_C11 1 | ||
#define OPENBLAS_PTHREAD_CREATE_FUNC pthread_create | ||
#define OPENBLAS_BUNDERSCORE _ | ||
#define OPENBLAS_NEEDBUNDERSCORE 1 | ||
#define OPENBLAS_GENERIC | ||
#define OPENBLAS_L1_DATA_SIZE 32768 | ||
#define OPENBLAS_L1_DATA_LINESIZE 128 | ||
#define OPENBLAS_L2_SIZE 512488 | ||
#define OPENBLAS_L2_LINESIZE 128 | ||
#define OPENBLAS_DTB_DEFAULT_ENTRIES 128 | ||
#define OPENBLAS_DTB_SIZE 4096 | ||
#define OPENBLAS_L2_ASSOCIATIVE 8 | ||
#define OPENBLAS_CORE_generic | ||
#define OPENBLAS_CHAR_CORENAME "generic" | ||
#define OPENBLAS_SLOCAL_BUFFER_SIZE 4096 | ||
#define OPENBLAS_DLOCAL_BUFFER_SIZE 4096 | ||
#define OPENBLAS_CLOCAL_BUFFER_SIZE 8192 | ||
#define OPENBLAS_ZLOCAL_BUFFER_SIZE 8192 | ||
#define OPENBLAS_GEMM_MULTITHREAD_THRESHOLD 4 | ||
#define OPENBLAS_VERSION " OpenBLAS 0.3.22 " | ||
/*This is only for "make install" target.*/ | ||
|
||
#if defined(OPENBLAS_OS_WINNT) || defined(OPENBLAS_OS_CYGWIN_NT) || defined(OPENBLAS_OS_INTERIX) | ||
#define OPENBLAS_WINDOWS_ABI | ||
#define OPENBLAS_OS_WINDOWS | ||
|
||
#ifdef DOUBLE | ||
#define DOUBLE_DEFINED DOUBLE | ||
#undef DOUBLE | ||
#endif | ||
#endif | ||
|
||
#ifdef OPENBLAS_NEEDBUNDERSCORE | ||
#define BLASFUNC(FUNC) FUNC##_ | ||
#else | ||
#define BLASFUNC(FUNC) FUNC | ||
#endif | ||
|
||
#ifdef OPENBLAS_QUAD_PRECISION | ||
typedef struct { | ||
unsigned long x[2]; | ||
} xdouble; | ||
#elif defined OPENBLAS_EXPRECISION | ||
#define xdouble long double | ||
#else | ||
#define xdouble double | ||
#endif | ||
|
||
#if defined(OPENBLAS_OS_WINDOWS) && defined(OPENBLAS___64BIT__) | ||
typedef long long BLASLONG; | ||
typedef unsigned long long BLASULONG; | ||
#else | ||
typedef long BLASLONG; | ||
typedef unsigned long BLASULONG; | ||
#endif | ||
|
||
#ifndef BFLOAT16 | ||
#include <stdint.h> | ||
typedef uint16_t bfloat16; | ||
#endif | ||
|
||
#ifdef OPENBLAS_USE64BITINT | ||
typedef BLASLONG blasint; | ||
#else | ||
typedef int blasint; | ||
#endif | ||
|
||
#if defined(XDOUBLE) || defined(DOUBLE) | ||
#define FLOATRET FLOAT | ||
#else | ||
#ifdef NEED_F2CCONV | ||
#define FLOATRET double | ||
#else | ||
#define FLOATRET float | ||
#endif | ||
#endif | ||
|
||
/* Inclusion of a standard header file is needed for definition of __STDC_* | ||
predefined macros with some compilers (e.g. GCC 4.7 on Linux). This occurs | ||
as a side effect of including either <features.h> or <stdc-predef.h>. */ | ||
#include <stdio.h> | ||
|
||
/* C99 supports complex floating numbers natively, which GCC also offers as an | ||
extension since version 3.0. If neither are available, use a compatible | ||
structure as fallback (see Clause 6.2.5.13 of the C99 standard). */ | ||
#if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ | ||
(__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) && !defined(_MSC_VER) | ||
#define OPENBLAS_COMPLEX_C99 | ||
#ifndef __cplusplus | ||
#include <complex.h> | ||
#endif | ||
typedef float _Complex openblas_complex_float; | ||
typedef double _Complex openblas_complex_double; | ||
typedef xdouble _Complex openblas_complex_xdouble; | ||
#define openblas_make_complex_float(real, imag) ((real) + ((imag) * _Complex_I)) | ||
#define openblas_make_complex_double(real, imag) ((real) + ((imag) * _Complex_I)) | ||
#define openblas_make_complex_xdouble(real, imag) ((real) + ((imag) * _Complex_I)) | ||
#define openblas_complex_float_real(z) (creal(z)) | ||
#define openblas_complex_float_imag(z) (cimag(z)) | ||
#define openblas_complex_double_real(z) (creal(z)) | ||
#define openblas_complex_double_imag(z) (cimag(z)) | ||
#define openblas_complex_xdouble_real(z) (creal(z)) | ||
#define openblas_complex_xdouble_imag(z) (cimag(z)) | ||
#else | ||
#define OPENBLAS_COMPLEX_STRUCT | ||
typedef struct { float real, imag; } openblas_complex_float; | ||
typedef struct { double real, imag; } openblas_complex_double; | ||
typedef struct { xdouble real, imag; } openblas_complex_xdouble; | ||
#define openblas_make_complex_float(real, imag) {(real), (imag)} | ||
#define openblas_make_complex_double(real, imag) {(real), (imag)} | ||
#define openblas_make_complex_xdouble(real, imag) {(real), (imag)} | ||
#define openblas_complex_float_real(z) ((z).real) | ||
#define openblas_complex_float_imag(z) ((z).imag) | ||
#define openblas_complex_double_real(z) ((z).real) | ||
#define openblas_complex_double_imag(z) ((z).imag) | ||
#define openblas_complex_xdouble_real(z) ((z).real) | ||
#define openblas_complex_xdouble_imag(z) ((z).imag) | ||
#endif | ||
|
||
/* Inclusion of Linux-specific header is needed for definition of cpu_set_t. */ | ||
#ifdef OPENBLAS_OS_LINUX | ||
#ifndef _GNU_SOURCE | ||
#define _GNU_SOURCE | ||
#endif | ||
#include <sched.h> | ||
#endif | ||
#endif /* OPENBLAS_CONFIG_H */ |
664b277
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Fails to compile on Linux(Arch) now. Have openBLAS installed. And when I mess with it so it does compile, it tries to use the Windows Dll anyway.
664b277
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Ahh that's a problem. Can I confirm that it was working fine for you before I integrated OpenBLAS? I might have to add some platform specific flags.
664b277
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Yeah, 49c4c22 is fine. I was already linking openBLAS when compiling before and everything was working. https://gist.github.com/rabidcopy/b21c11466ff03c252d9d8a4f5f65c7ce (ignore the compile warnings, that is due to a recent merged PR on llama.cpp)
664b277
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Hi @rabidcopy , thanks for the help to test. I have added a few flags that should prevent build errors - can you try your usual build workflow again with the newest commit?
If you have openblas installed, I assume you normally build with LLAMA_OPENBLAS=1? Let me know if everything works now.
664b277
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Seems good now. Thanks for the fix! https://gist.github.com/rabidcopy/7af97cd87aa7f529c550a1bbdbaad2d6 It shows BLAS = 1, so think everything is working as intended.