mtmd : refactor llava-uhd preprocessing logic (#14247)
* mtmd : refactor llava-uhd preprocessing logic
* fix editorconfig
This commit is contained in:
parent
95402553a5
commit
413977de32
3 changed files with 110 additions and 80 deletions
|
@@ -46,9 +46,6 @@ int32_t clip_get_hidden_size(const struct clip_ctx * ctx);
|
|||
// TODO: should be enum, not string
|
||||
const char * clip_patch_merge_type(const struct clip_ctx * ctx);
|
||||
|
||||
const int32_t * clip_image_grid(const struct clip_ctx * ctx);
|
||||
size_t get_clip_image_grid_size(const struct clip_ctx * ctx);
|
||||
|
||||
int clip_n_output_tokens(const struct clip_ctx * ctx, struct clip_image_f32 * img);
|
||||
|
||||
// for M-RoPE, this will be the number of token positions in X and Y directions
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue