feat(backend): minor refactor
commit d4b5be10f9
parent 92bb113653
@@ -123,7 +123,7 @@ namespace huggingface::tgi::backends::llama {
 #else
         const auto status = llama_decode(ctx, batch);
 #endif
-        if (status == LLAMA_SUCCESS) {
+        if (LLAMA_SUCCESS(status)) {
             // Sample the new token
             auto new_token_id = llama_sampler_sample(*sampler, ctx, -1);
             generated.emplace_back(new_token_id);
@@ -133,7 +133,6 @@ namespace huggingface::tgi::backends::llama {
             batch = llama_batch_get_one(&new_token_id, 1);
         }
     }
     generated.shrink_to_fit();
     return generated;
 }
 }
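For context, the hunk above sits inside the backend's token-generation loop. Below is a minimal sketch of that loop; the function name, its parameters, the max_new_tokens bound, and the use of raw llama_context*/llama_sampler* pointers are assumptions (the commit's own call site dereferences a wrapped sampler via *sampler), and only the lines visible in the hunks are taken from the commit.

#include <cstddef>
#include <vector>
#include <llama.h>

// As in the header change below: success when llama_decode returns 0.
#define LLAMA_SUCCESS(x) x == 0

// Sketch only: name, signature, and stopping condition are assumptions.
std::vector<llama_token> GenerateSketch(llama_context *ctx,
                                        llama_sampler *sampler,
                                        llama_batch batch,
                                        size_t max_new_tokens) {
    std::vector<llama_token> generated;
    generated.reserve(max_new_tokens);

    // Kept outside the loop: the single-token batch below stores a pointer
    // to this variable across iterations.
    llama_token new_token_id = 0;

    for (size_t step = 0; step < max_new_tokens; ++step) {
        // llama_decode returns 0 on success.
        const auto status = llama_decode(ctx, batch);
        if (LLAMA_SUCCESS(status)) {
            // Sample the new token from the last logits position.
            new_token_id = llama_sampler_sample(sampler, ctx, -1);
            generated.emplace_back(new_token_id);

            // Feed the sampled token back in as a single-token batch.
            batch = llama_batch_get_one(&new_token_id, 1);
        }
    }

    generated.shrink_to_fit();
    return generated;
}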
@@ -10,7 +10,7 @@
 #include <memory>
 #include <llama.h>

-#define LLAMA_SUCCESS 0
+#define LLAMA_SUCCESS(x) x == 0

 namespace huggingface::tgi::backends::llama {
     enum TgiLlamaCppBackendError {
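The header change turns LLAMA_SUCCESS from a plain constant into a function-like macro, so the call site above reads LLAMA_SUCCESS(status) instead of status == LLAMA_SUCCESS. A small standalone illustration of the expansion follows; the fake_decode stub is invented purely to keep the example self-contained.

#include <cstdio>

// As committed in the header: LLAMA_SUCCESS(x) expands to `x == 0`,
// matching llama_decode's convention of returning 0 on success.
#define LLAMA_SUCCESS(x) x == 0

// Hypothetical stand-in for llama_decode, used only for this example.
static int fake_decode(bool ok) { return ok ? 0 : 1; }

int main() {
    const auto status = fake_decode(true);

    // `LLAMA_SUCCESS(status)` expands to `status == 0`.
    if (LLAMA_SUCCESS(status)) {
        std::printf("decode succeeded\n");
    }

    // Because the expansion is not parenthesized, an argument using an
    // operator with lower precedence than `==` (e.g. LLAMA_SUCCESS(a & b))
    // would expand to `a & b == 0`, grouping as `a & (b == 0)`. The call
    // sites in this commit only pass a plain variable, so this does not
    // bite here.
    return 0;
}

Parenthesizing the expansion as ((x) == 0) would make the macro robust to such arguments; the commit as shown keeps the unparenthesized form.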