// text-generation-inference/backends/llamacpp/csrc/backend.hpp

//
// Created by Morgan Funtowicz on 9/28/2024.
//
#ifndef TGI_LLAMA_CPP_BACKEND_BACKEND_HPP
#define TGI_LLAMA_CPP_BACKEND_BACKEND_HPP
#include <memory>
#include <string_view>
#include <llama.h>
namespace huggingface::tgi::backends::llama {
// Backend name constant, currently disabled:
// const char* TGI_BACKEND_LLAMA_CPP_NAME = "llama.cpp";
class TgiLlamaCppBackend {
private:
llama_model* model;
llama_context* ctx;
llama_batch batch;
public:
2024-10-04 08:42:31 +00:00
TgiLlamaCppBackend(llama_model *model, llama_context *ctx);
~TgiLlamaCppBackend();
2024-10-04 08:42:31 +00:00
void schedule();
};
/**
 * Factory for TgiLlamaCppBackend; declared here, defined elsewhere.
 * @param root non-owning string view.
 *             NOTE(review): presumably the path to the model to load --
 *             confirm against the definition.
 * @return a std::unique_ptr owning the backend instance.
 *         NOTE(review): whether it can be null on failure is not visible
 *         from this header.
 */
std::unique_ptr<TgiLlamaCppBackend> CreateLlamaCppBackend(std::string_view root);
}
#endif //TGI_LLAMA_CPP_BACKEND_BACKEND_HPP