2023-12-20 10:36:01 -08:00
|
|
|
#include <stdlib.h>
|
|
|
|
|
2023-12-22 09:51:53 -08:00
|
|
|
#include "ext_server.h"
|
2023-12-20 10:36:01 -08:00
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
struct dynamic_llama_server {
|
|
|
|
void *handle;
|
|
|
|
void (*llama_server_init)(ext_server_params_t *sparams,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
void (*llama_server_start)();
|
|
|
|
void (*llama_server_stop)();
|
|
|
|
void (*llama_server_completion)(const char *json_req,
|
|
|
|
ext_server_resp_t *resp);
|
|
|
|
void (*llama_server_completion_next_result)(const int task_id,
|
|
|
|
ext_server_task_result_t *result);
|
|
|
|
void (*llama_server_completion_cancel)(const int task_id,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
void (*llama_server_release_task_result)(ext_server_task_result_t *result);
|
|
|
|
void (*llama_server_tokenize)(const char *json_req, char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
void (*llama_server_detokenize)(const char *json_req, char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
void (*llama_server_embedding)(const char *json_req, char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
void (*llama_server_release_json_resp)(char **json_resp);
|
|
|
|
};
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_init(const char *libPath, struct dynamic_llama_server *s,
|
2023-12-20 10:36:01 -08:00
|
|
|
ext_server_resp_t *err);
|
|
|
|
|
|
|
|
// No good way to call C function pointers from Go so inline the indirection
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_init(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
ext_server_params_t *sparams,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_start(struct dynamic_llama_server s);
|
2023-12-20 10:36:01 -08:00
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_stop(struct dynamic_llama_server s);
|
2023-12-20 10:36:01 -08:00
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_completion(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
const char *json_req,
|
|
|
|
ext_server_resp_t *resp);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_completion_next_result(
|
2023-12-20 10:36:01 -08:00
|
|
|
struct dynamic_llama_server s, const int task_id,
|
|
|
|
ext_server_task_result_t *result);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_completion_cancel(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
const int task_id,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_release_task_result(
|
2023-12-20 10:36:01 -08:00
|
|
|
struct dynamic_llama_server s, ext_server_task_result_t *result);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_tokenize(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
const char *json_req, char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_detokenize(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
const char *json_req,
|
|
|
|
char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
|
|
|
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_embedding(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
const char *json_req, char **json_resp,
|
|
|
|
ext_server_resp_t *err);
|
2024-01-09 20:29:58 -08:00
|
|
|
void dyn_llama_server_release_json_resp(struct dynamic_llama_server s,
|
2023-12-20 10:36:01 -08:00
|
|
|
char **json_resp);
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
|
|
|
#endif
|