74 lines
3.3 KiB
C
74 lines
3.3 KiB
C
|
#include <stdlib.h>
|
||
|
|
||
|
#include "server.h"
|
||
|
|
||
|
#ifdef __cplusplus
|
||
|
extern "C" {
|
||
|
#endif
|
||
|
struct dynamic_llama_server {
|
||
|
void *handle;
|
||
|
void (*llama_server_init)(ext_server_params_t *sparams,
|
||
|
ext_server_resp_t *err);
|
||
|
void (*llama_server_start)();
|
||
|
void (*llama_server_stop)();
|
||
|
void (*llama_server_completion)(const char *json_req,
|
||
|
ext_server_resp_t *resp);
|
||
|
void (*llama_server_completion_next_result)(const int task_id,
|
||
|
ext_server_task_result_t *result);
|
||
|
void (*llama_server_completion_cancel)(const int task_id,
|
||
|
ext_server_resp_t *err);
|
||
|
void (*llama_server_release_task_result)(ext_server_task_result_t *result);
|
||
|
void (*llama_server_tokenize)(const char *json_req, char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
void (*llama_server_detokenize)(const char *json_req, char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
void (*llama_server_embedding)(const char *json_req, char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
void (*llama_server_release_json_resp)(char **json_resp);
|
||
|
};
|
||
|
|
||
|
void dynamic_shim_init(const char *libPath, struct dynamic_llama_server *s,
|
||
|
ext_server_resp_t *err);
|
||
|
|
||
|
// No good way to call C function pointers from Go so inline the indirection
|
||
|
void dynamic_shim_llama_server_init(struct dynamic_llama_server s,
|
||
|
ext_server_params_t *sparams,
|
||
|
ext_server_resp_t *err);
|
||
|
|
||
|
void dynamic_shim_llama_server_start(struct dynamic_llama_server s);
|
||
|
|
||
|
void dynamic_shim_llama_server_stop(struct dynamic_llama_server s);
|
||
|
|
||
|
void dynamic_shim_llama_server_completion(struct dynamic_llama_server s,
|
||
|
const char *json_req,
|
||
|
ext_server_resp_t *resp);
|
||
|
|
||
|
void dynamic_shim_llama_server_completion_next_result(
|
||
|
struct dynamic_llama_server s, const int task_id,
|
||
|
ext_server_task_result_t *result);
|
||
|
|
||
|
void dynamic_shim_llama_server_completion_cancel(struct dynamic_llama_server s,
|
||
|
const int task_id,
|
||
|
ext_server_resp_t *err);
|
||
|
|
||
|
void dynamic_shim_llama_server_release_task_result(
|
||
|
struct dynamic_llama_server s, ext_server_task_result_t *result);
|
||
|
|
||
|
void dynamic_shim_llama_server_tokenize(struct dynamic_llama_server s,
|
||
|
const char *json_req, char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
|
||
|
void dynamic_shim_llama_server_detokenize(struct dynamic_llama_server s,
|
||
|
const char *json_req,
|
||
|
char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
|
||
|
void dynamic_shim_llama_server_embedding(struct dynamic_llama_server s,
|
||
|
const char *json_req, char **json_resp,
|
||
|
ext_server_resp_t *err);
|
||
|
void dynamic_shim_llama_server_release_json_resp(struct dynamic_llama_server s,
|
||
|
char **json_resp);
|
||
|
|
||
|
#ifdef __cplusplus
|
||
|
}
|
||
|
#endif
|