chat: fix build on Windows and Nomic Embed path on macOS (#2467)

* chat: remove unused oscompat source files

These files are no longer needed now that the hnswlib index is gone.
This also fixes the Windows build, which was failing with a compilation
error in oscompat.cpp.

Signed-off-by: Jared Van Bortel <jared@nomic.ai>

* llm: fix pragma to be recognized by MSVC

Replaces this MSVC warning:
C:\msys64\home\Jared\gpt4all\gpt4all-chat\llm.cpp(53,21): warning C4081: expected '('; found 'string'

With this:
C:\msys64\home\Jared\gpt4all\gpt4all-chat\llm.cpp : warning : offline installer build will not check for updates!

Signed-off-by: Jared Van Bortel <jared@nomic.ai>
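
For context, a sketch of the portable pattern (the exact directive changed in llm.cpp is assumed here, inferred from the two warnings quoted above): MSVC reports C4081 for a bare-string pragma argument and wants it parenthesized, while GCC and Clang support the standard `#warning` directive.

    // Hedged sketch: emit a build-time note on both compiler families.
    // MSVC's #pragma message requires a parenthesized argument (C4081
    // otherwise); GCC/Clang accept #warning directly.
    #ifdef _MSC_VER
    #   pragma message(__FILE__ ": warning: offline installer build will not check for updates!")
    #else
    #   warning "offline installer build will not check for updates!"
    #endif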

* usearch: fork usearch to fix `CreateFile` build error

Signed-off-by: Jared Van Bortel <jared@nomic.ai>
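
For context, a minimal sketch of this class of error (how the fork actually resolves it is not shown in this commit; `FileMaker` is a hypothetical name):

    #include <windows.h>
    #ifdef CreateFile
    #undef CreateFile // stop the macro from rewriting unrelated identifiers
    #endif

    // <windows.h> defines CreateFile as a macro expanding to CreateFileA or
    // CreateFileW, so any method literally named CreateFile gets silently
    // renamed by the preprocessor and fails to compile or link.
    struct FileMaker {
        void CreateFile() {} // safe only because of the #undef above
    };

    int main()
    {
        FileMaker{}.CreateFile();
        return 0;
    }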

* dlhandle: fix incorrect assertion on Windows

SetErrorMode returns the previous value of the error mode flags, not an
indicator of success.

Signed-off-by: Jared Van Bortel <jared@nomic.ai>
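
A condensed sketch of the failure mode (the actual change is in the dlhandle.cpp diff below): the process-default error mode is 0, so asserting on the return value can fire on a perfectly successful call.

    #include <windows.h>

    // SetErrorMode returns the *previous* error-mode flags, which default
    // to 0, so assert(SetErrorMode(...)) is wrong even when the call works.
    void demoErrorMode()
    {
        UINT lastErrorMode = GetErrorMode();
        SetErrorMode(lastErrorMode | SEM_FAILCRITICALERRORS); // returns old mode (possibly 0), not a success flag
        // ... LoadLibraryExW(...) would go here ...
        SetErrorMode(lastErrorMode); // restore; again, nothing to assert on
    }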

* llamamodel: fix UB in LLamaModel::embedInternal

It is undefined behavior to increment an STL iterator past the end of
the container. Use offsets to do the math instead.

Signed-off-by: Jared Van Bortel <jared@nomic.ai>
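
A condensed sketch of the fix, mirroring the llamamodel.cpp diff below (names are illustrative): `it += max_len` can step an iterator past end(), which is UB even if the result is never dereferenced, whereas index arithmetic can be clamped safely with std::min.

    #include <algorithm>
    #include <cstddef>
    #include <vector>

    // Offset-based chunking; assumes overlap < max_len, as with
    // chunkOverlap in the real code.
    void chunkTokens(const std::vector<int> &input, size_t max_len, size_t overlap)
    {
        for (size_t j = 0; j < input.size(); j += max_len) {
            if (j) j -= overlap; // back up so consecutive chunks overlap
            size_t end = std::min(j + max_len, input.size()); // plain integer math, no UB
            std::vector<int> batch(input.begin() + j, input.begin() + end);
            // ... embed `batch` ...
        }
    }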

* cmake: install embedding model to bundle's Resources dir on macOS

Signed-off-by: Jared Van Bortel <jared@nomic.ai>

* ci: fix macOS build by explicitly installing Rosetta

Signed-off-by: Jared Van Bortel <jared@nomic.ai>

---------

Signed-off-by: Jared Van Bortel <jared@nomic.ai>
Jared Van Bortel authored 2024-06-25 17:22:51 -04:00, committed by GitHub
parent bbf0c2f246, commit 88d85be0f9
10 changed files with 61 additions and 125 deletions

gpt4all-backend/dlhandle.cpp

@@ -46,13 +46,11 @@ Dlhandle::Dlhandle(const fs::path &fpath)
     // Suppress the "Entry Point Not Found" dialog, caused by outdated nvcuda.dll from the GPU driver
     UINT lastErrorMode = GetErrorMode();
-    UINT success = SetErrorMode(lastErrorMode | SEM_FAILCRITICALERRORS);
-    assert(success);
+    SetErrorMode(lastErrorMode | SEM_FAILCRITICALERRORS);
     chandle = LoadLibraryExW(afpath.c_str(), NULL, LOAD_LIBRARY_SEARCH_DEFAULT_DIRS | LOAD_LIBRARY_SEARCH_DLL_LOAD_DIR);
-    success = SetErrorMode(lastErrorMode);
-    assert(success);
+    SetErrorMode(lastErrorMode);
     if (!chandle) {
         DWORD err = GetLastError();

gpt4all-backend/llamamodel.cpp

@@ -1003,14 +1003,14 @@ void LLamaModel::embedInternal(
     size_t totalTokens = 0;
     for (unsigned i = 0; i < inputs.size(); i++) {
         auto &input = inputs[i];
-        for (auto it = input.begin(); it < input.end(); it += max_len) {
-            if (it > input.begin()) { it -= chunkOverlap; }
-            auto end = std::min(it + max_len, input.end());
+        for (unsigned j = 0; j < input.size(); j += max_len) {
+            if (j) { j -= chunkOverlap; }
+            unsigned end = std::min(j + max_len, unsigned(input.size()));
             batches.push_back({ i, {} });
             auto &batch = batches.back().batch;
             batch = prefixTokens;
-            batch.insert(batch.end(), it, end);
-            totalTokens += end - it;
+            batch.insert(batch.end(), input.begin() + j, input.begin() + end);
+            totalTokens += end - j;
             batch.push_back(eos_token);
             if (!doMean) { break; /* limit text to one chunk */ }
         }