ollama/llama/binding/binding.h

48 lines
1.6 KiB
C
Raw Normal View History

2023-07-03 16:32:48 -04:00
#ifdef __cplusplus
#include <string>
#include <vector>
extern "C" {
#endif
#include <stdbool.h>
/*
 * tokenCallback - declared here, defined outside this header.
 *
 * Takes two unnamed arguments (an opaque void pointer and a mutable C string)
 * and returns an unsigned char.
 * NOTE(review): presumably invoked once per generated token, with the return
 * value acting as a continue/stop flag - confirm against the definition.
 */
unsigned char tokenCallback(
    void *,
    char *);
2023-07-05 16:28:18 -04:00
/*
 * load_state - prototype only; the implementation is not part of this header.
 *
 * ctx:       opaque pointer; its concrete type is not visible here.
 * statefile: mutable C string; presumably the path of the state file to read
 *            (TODO confirm against the implementation).
 * modes:     mutable C string; NOTE(review): looks like a file-open mode
 *            string - verify.
 *
 * Returns an int; this header does not establish what the value means.
 */
int load_state(
    void *ctx,
    char *statefile,
    char *modes);
/*
 * eval - prototype only; the implementation is not part of this header.
 *
 * params_ptr: opaque pointer; presumably a parameter object produced by
 *             llama_allocate_params (TODO confirm).
 * ctx:        opaque pointer; concrete type not visible here.
 * text:       mutable C string handed to the implementation.
 *
 * Returns an int; this header does not establish what the value means.
 */
int eval(
    void *params_ptr,
    void *ctx,
    char *text);
/*
 * save_state - prototype only; the implementation is not part of this header.
 *
 * ctx:   opaque pointer; concrete type not visible here.
 * dst:   mutable C string; presumably the destination path for the saved
 *        state (TODO confirm against the implementation).
 * modes: mutable C string; NOTE(review): looks like a file-open mode string -
 *        verify.
 *
 * Returns nothing, so any failure cannot be reported through the return value.
 */
void save_state(
    void *ctx,
    char *dst,
    char *modes);
2023-07-03 16:32:48 -04:00
/*
 * load_model - prototype only; the implementation is not part of this header.
 *
 * Accepts a file name plus a set of integer, boolean and string settings and
 * returns an opaque pointer. The meaning of each setting is defined by the
 * implementation; the names below are the only information this header gives.
 * NOTE(review): presumably the returned pointer is the model/state handle that
 * the other functions take as `state`/`state_pr`/`ctx`, and a null return
 * signals failure - confirm before relying on either.
 */
void *load_model(
    const char *fname,
    int n_ctx,
    int n_seed,
    bool memory_f16,
    bool mlock,
    bool embeddings,
    bool mmap,
    bool low_vram,
    bool vocab_only,
    int n_gpu,
    int n_batch,
    const char *maingpu,
    const char *tensorsplit,
    bool numa);
2023-07-05 16:28:18 -04:00
/*
 * get_embeddings - prototype only; the implementation is not part of this
 * header.
 *
 * params_ptr:     opaque pointer; presumably a parameter object from
 *                 llama_allocate_params (TODO confirm).
 * state_pr:       opaque pointer; presumably the handle returned by load_model
 *                 (TODO confirm).
 * res_embeddings: pointer to float storage supplied by the caller.
 *                 NOTE(review): the required capacity is not stated here -
 *                 check the implementation before sizing the buffer.
 *
 * Returns an int; this header does not establish what the value means.
 */
int get_embeddings(
    void *params_ptr,
    void *state_pr,
    float *res_embeddings);
/*
 * get_token_embeddings - prototype only; the implementation is not part of
 * this header.
 *
 * params_ptr:     opaque pointer; presumably a parameter object from
 *                 llama_allocate_params (TODO confirm).
 * state_pr:       opaque pointer; presumably the handle returned by load_model
 *                 (TODO confirm).
 * tokens:         pointer to int data.
 * tokenSize:      int passed alongside `tokens`; presumably the number of
 *                 entries in `tokens` (TODO confirm).
 * res_embeddings: pointer to float storage supplied by the caller; required
 *                 capacity is not stated in this header.
 *
 * Returns an int; this header does not establish what the value means.
 */
int get_token_embeddings(
    void *params_ptr,
    void *state_pr,
    int *tokens,
    int tokenSize,
    float *res_embeddings);
2023-07-03 16:32:48 -04:00
/*
 * llama_allocate_params - prototype only; the implementation is not part of
 * this header.
 *
 * Takes the prompt text followed by a flat list of numeric, boolean and string
 * settings and returns an opaque pointer. The parameter list must stay a
 * single uninterrupted declarator: any non-C text between the parameters makes
 * the header fail to compile for every includer.
 *
 * antiprompt / antiprompt_count: an array of C strings and an int passed with
 * it; presumably the int is the number of entries (TODO confirm).
 * NOTE(review): presumably the returned pointer must later be handed to
 * llama_free_params - confirm ownership in the implementation.
 */
void *llama_allocate_params(
    const char *prompt,
    int seed,
    int threads,
    int tokens,
    int top_k,
    float top_p,
    float temp,
    float repeat_penalty,
    int repeat_last_n,
    bool ignore_eos,
    bool memory_f16,
    int n_batch,
    int n_keep,
    const char **antiprompt,
    int antiprompt_count,
    float tfs_z,
    float typical_p,
    float frequency_penalty,
    float presence_penalty,
    int mirostat,
    float mirostat_eta,
    float mirostat_tau,
    bool penalize_nl,
    const char *logit_bias,
    bool mlock,
    bool mmap,
    const char *maingpu,
    const char *tensorsplit);
2023-07-03 16:32:48 -04:00
/*
 * llama_free_params - prototype only; the implementation is not part of this
 * header.
 *
 * params_ptr: opaque pointer. NOTE(review): presumably a value previously
 *             returned by llama_allocate_params, released by this call -
 *             confirm against the implementation.
 */
void llama_free_params(
    void *params_ptr);
2023-07-05 16:28:18 -04:00
/*
 * llama_binding_free_model - prototype only; the implementation is not part
 * of this header.
 *
 * state: opaque pointer. NOTE(review): presumably the handle returned by
 *        load_model, released by this call - confirm against the
 *        implementation.
 */
void llama_binding_free_model(
    void *state);
2023-07-03 16:32:48 -04:00
/*
 * llama_predict - prototype only; the implementation is not part of this
 * header.
 *
 * params_ptr: opaque pointer; presumably a parameter object from
 *             llama_allocate_params (TODO confirm).
 * state_pr:   opaque pointer; presumably the handle returned by load_model
 *             (TODO confirm).
 * result:     mutable char buffer supplied by the caller. No length is passed
 *             alongside it, so the required capacity must be taken from the
 *             implementation.
 * debug:      boolean flag forwarded to the implementation.
 *
 * Returns an int; this header does not establish what the value means.
 */
int llama_predict(
    void *params_ptr,
    void *state_pr,
    char *result,
    bool debug);
#ifdef __cplusplus
}
2023-07-05 16:28:18 -04:00
/*
 * create_vector - C++-only prototype (visible only when __cplusplus is
 * defined); the implementation is not part of this header.
 *
 * strings: array of C strings.
 * count:   int passed alongside `strings`; presumably the number of entries
 *          to read from it (TODO confirm).
 *
 * Returns a std::vector<std::string> by value.
 */
std::vector<std::string> create_vector(
    const char **strings,
    int count);
/*
 * delete_vector - C++-only prototype (visible only when __cplusplus is
 * defined); the implementation is not part of this header.
 *
 * vec: pointer to a std::vector<std::string>. NOTE(review): the name suggests
 *      the pointee is destroyed, which would require it to be heap-allocated -
 *      confirm against the implementation before passing a stack object.
 */
void delete_vector(
    std::vector<std::string> *vec);
#endif