Latest rebase on llama.cpp with gguf support.

2025-10-28 20:30:26 +00:00 · 2023-09-21 12:41:48 -04:00
parent 5f3d739205
commit d90d003a1d
12 changed files with 245 additions and 85 deletions
--- a/gpt4all-backend/bert.cpp
+++ b/gpt4all-backend/bert.cpp
@@ -345,7 +345,7 @@ void bert_eval(

    // embd norm
    {
-        inpL = ggml_norm(ctx0, inpL);
+        inpL = ggml_norm(ctx0, inpL, 1e-5f);

        inpL = ggml_add(ctx0,
                        ggml_mul(ctx0,
@@ -406,7 +406,7 @@ void bert_eval(

        // attention norm
        {
-            cur = ggml_norm(ctx0, cur);
+            cur = ggml_norm(ctx0, cur, 1e-5f);

            cur = ggml_add(ctx0,
                           ggml_mul(ctx0,
@@ -432,7 +432,7 @@ void bert_eval(

        // output norm
        {
-            cur = ggml_norm(ctx0, cur);
+            cur = ggml_norm(ctx0, cur, 1e-5f);

            cur = ggml_add(ctx0,
                           ggml_mul(ctx0,
@@ -1038,13 +1038,16 @@ DLL_EXPORT const char *get_build_variant() {
    return GGML_BUILD_VARIANT;
 }

-DLL_EXPORT bool magic_match(std::istream& f) {
+DLL_EXPORT bool magic_match(const char* fname) {
+#if 0
    uint32_t magic = 0;
    f.read(reinterpret_cast<char*>(&magic), sizeof(magic));
    if (magic != 0x62657274) {
         return false;
    }
    return true;
+#endif
+    return false;
 }

 DLL_EXPORT LLModel *construct() {