2023-11-06 22:36:23 +01:00
# ifndef LLAVA_H
# define LLAVA_H
#include "ggml.h"

#include <stdbool.h>
#ifdef __cplusplus
#include <vector>
#endif
/*
 * LLAVA_API decorates the function prototypes declared in this header.
 *   - LLAMA_SHARED undefined: expands to nothing.
 *   - LLAMA_SHARED on _WIN32 (excluding __MINGW32__): __declspec(dllexport)
 *     when LLAMA_BUILD is defined, __declspec(dllimport) otherwise.
 *   - LLAMA_SHARED on any other target: __attribute__((visibility("default"))).
 */
#if !defined(LLAMA_SHARED)
#    define LLAVA_API
#elif defined(_WIN32) && !defined(__MINGW32__)
#    if defined(LLAMA_BUILD)
#        define LLAVA_API __declspec(dllexport)
#    else
#        define LLAVA_API __declspec(dllimport)
#    endif
#else
#    define LLAVA_API __attribute__ ((visibility ("default")))
#endif
/*
 * Forward declarations of the struct types that this header only ever uses
 * through pointers; their definitions are not part of this header.
 * Declaring the tags at file scope keeps them from being introduced with
 * prototype scope when a C translation unit includes this header before the
 * headers that define them.
 */
struct clip_ctx;
struct clip_image_u8;
struct llama_context;
2024-06-04 15:10:00 +08:00
struct uhd_image_embed {
std : : vector < std : : vector < struct llava_image_embed * > > image_embeds ;
} ;
2023-11-06 22:36:23 +01:00
#ifdef __cplusplus
/* C++ builds: give the declarations that follow C language linkage. */
extern "C" {
#endif
/**
 * An image embedding, as returned by the llava_image_embed_make_with_*
 * functions and released with llava_image_embed_free().
 */
struct llava_image_embed {
    /* Embedding values. NOTE(review): buffer length and layout are not
     * specified in this header -- confirm in the implementation. */
    float * embed;
    /* Presumably the number of context positions the embedding occupies
     * (see llava_eval_image_embed) -- confirm. */
    int     n_image_pos;
};
/** sanity check for clip <-> llava embed size match */
2024-03-15 22:31:05 +08:00
/**
 * Sanity-check that the embedding size of the clip context matches the one
 * used by the llama context.
 *
 * @param ctx_llama  llama context to check against (not modified).
 * @param ctx_clip   clip context to check (not modified).
 * @return NOTE(review): presumably true when the sizes match -- confirm in
 *         the implementation.
 */
LLAVA_API bool llava_validate_embed_size(
        const struct llama_context * ctx_llama,
        const struct clip_ctx      * ctx_clip);
2023-11-06 22:36:23 +01:00
2024-03-15 22:31:05 +08:00
/**
 * Build an image embedding from a clip_image_u8 (going by the function name).
 *
 * @param ctx_clip        clip context.
 * @param n_threads       thread count passed to the implementation.
 * @param img             input image (not modified).
 * @param image_embd_out  output: pointer to the embedding buffer.
 *                        NOTE(review): ownership / how to free it is not
 *                        stated in this header -- confirm.
 * @param n_img_pos_out   output: presumably the number of image positions
 *                        in the embedding -- confirm.
 * @return NOTE(review): presumably true on success -- confirm.
 */
LLAVA_API bool llava_image_embed_make_with_clip_img(
        struct clip_ctx            * ctx_clip,
        int                          n_threads,
        const struct clip_image_u8 * img,
        float                     ** image_embd_out,
        int                        * n_img_pos_out);
2024-02-20 11:07:22 -08:00
2023-11-06 22:36:23 +01:00
/**
 * Build an image embed from image file bytes.
 *
 * @param ctx_clip            clip context.
 * @param n_threads           thread count passed to the implementation.
 * @param image_bytes         buffer holding the image file contents.
 * @param image_bytes_length  number of bytes in image_bytes.
 * @return the new embed; release it with llava_image_embed_free().
 *         NOTE(review): the failure value (presumably NULL) is not stated
 *         in this header -- confirm.
 */
LLAVA_API struct llava_image_embed * llava_image_embed_make_with_bytes(
        struct clip_ctx     * ctx_clip,
        int                   n_threads,
        const unsigned char * image_bytes,
        int                   image_bytes_length);
/**
 * Build an image embed from a path to an image file.
 *
 * @param ctx_clip    clip context.
 * @param n_threads   thread count passed to the implementation.
 * @param image_path  path of the image file to load.
 * @return the new embed; release it with llava_image_embed_free().
 *         NOTE(review): the failure value (presumably NULL) is not stated
 *         in this header -- confirm.
 */
LLAVA_API struct llava_image_embed * llava_image_embed_make_with_filename(
        struct clip_ctx * ctx_clip,
        int               n_threads,
        const char      * image_path);
/**
 * Free an embedding made with llava_image_embed_make_*.
 *
 * @param embed  embedding to release.
 *               NOTE(review): whether NULL is accepted is not stated in
 *               this header -- confirm.
 */
LLAVA_API void llava_image_embed_free(struct llava_image_embed * embed);
2024-06-04 15:10:00 +08:00
/**
 * Build a uhd image embed from an image.
 * Despite the "_with_bytes" name, the image is passed as a clip_image_u8;
 * this function takes no raw byte buffer or length.
 *
 * @param ctx_clip   clip context.
 * @param n_threads  thread count passed to the implementation.
 * @param img        input image (not modified).
 * @return the new uhd embed; presumably released with
 *         llava_image_embed_free_uhd() -- confirm.
 */
LLAVA_API struct uhd_image_embed * llava_image_embed_make_with_bytes_uhd(
        struct clip_ctx            * ctx_clip,
        int                          n_threads,
        const struct clip_image_u8 * img);
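/** build an image embed from a path to an image filename -- NOTE(review): this describes llava_image_embed_make_with_filename_uhd (declared further down), not the prototype that immediately follows */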
2024-06-25 18:51:06 +08:00
/**
 * uhd counterpart of llava_image_embed_make_with_clip_img (same parameter
 * list).
 * NOTE(review): how its processing differs from the non-uhd function is not
 * visible in this header -- confirm in the implementation.
 *
 * @param ctx_clip        clip context.
 * @param n_threads       thread count passed to the implementation.
 * @param img             input image (not modified).
 * @param image_embd_out  output: pointer to the embedding buffer
 *                        (ownership not stated here -- confirm).
 * @param n_img_pos_out   output: presumably the number of image positions
 *                        -- confirm.
 * @return NOTE(review): presumably true on success -- confirm.
 */
LLAVA_API bool llava_image_embed_make_with_clip_img_uhd(
        struct clip_ctx            * ctx_clip,
        int                          n_threads,
        const struct clip_image_u8 * img,
        float                     ** image_embd_out,
        int                        * n_img_pos_out);
2024-06-04 15:10:00 +08:00
/**
 * "ollama" variant of llava_image_embed_make_with_clip_img (same parameter
 * list).
 * NOTE(review): what distinguishes this variant is not visible in this
 * header -- confirm in the implementation.
 *
 * @param ctx_clip        clip context.
 * @param n_threads       thread count passed to the implementation.
 * @param img             input image (not modified).
 * @param image_embd_out  output: pointer to the embedding buffer
 *                        (ownership not stated here -- confirm).
 * @param n_img_pos_out   output: presumably the number of image positions
 *                        -- confirm.
 * @return NOTE(review): presumably true on success -- confirm.
 */
LLAVA_API bool llava_image_embed_make_with_clip_img_ollama(
        struct clip_ctx            * ctx_clip,
        int                          n_threads,
        const struct clip_image_u8 * img,
        float                     ** image_embd_out,
        int                        * n_img_pos_out);
/**
 * Build a uhd image embed from a path to an image file.
 *
 * @param ctx_clip    clip context.
 * @param n_threads   thread count passed to the implementation.
 * @param image_path  path of the image file to load.
 * @return the new uhd embed; presumably released with
 *         llava_image_embed_free_uhd() -- confirm.
 */
LLAVA_API struct uhd_image_embed * llava_image_embed_make_with_filename_uhd(
        struct clip_ctx * ctx_clip,
        int               n_threads,
        const char      * image_path);
/**
 * Free a uhd image embed.
 *
 * @param embed  uhd embed to release; presumably one returned by the
 *               llava_image_embed_make_with_*_uhd functions -- confirm.
 */
LLAVA_API void llava_image_embed_free_uhd(
        struct uhd_image_embed * embed);
2023-11-06 22:36:23 +01:00
/**
 * Write the image represented by embed into the llama context.
 *
 * @param ctx_llama  llama context that receives the image embed.
 * @param embed      image embed to write (not modified).
 * @param n_batch    batch size used while writing.
 * @param n_past     in: context position to start at; out: on completion,
 *                   the next position in the context after the image embed.
 * @return NOTE(review): presumably true on success -- confirm.
 */
LLAVA_API bool llava_eval_image_embed(
        struct llama_context           * ctx_llama,
        const struct llava_image_embed * embed,
        int                              n_batch,
        int                            * n_past);
# ifdef __cplusplus
} /* closes the extern "C" linkage block opened earlier in this header */
# endif
# endif /* LLAVA_H include guard */