Skip to content

Commit c536fa6

Browse files
committed
rename
1 parent 7a49a6f commit c536fa6

File tree

2 files changed

+12
-12
lines changed

2 files changed

+12
-12
lines changed

examples/minicpmv/README.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -6,14 +6,14 @@ make
66
make minicpmv-cli
77

88
python ./examples/minicpmv/minicpmv-surgery.py -m ../MiniCPM-V-2_5
9-
python ./examples/minicpmv/minicpmv-convert-image-encoder-to-gguf.py -m ../MiniCPM-V-2_5 --llava-projector ../MiniCPM-V-2_5/llava.projector --output-dir ../MiniCPM-V-2_5/ --image-mean 0.5 0.5 0.5 --image-std 0.5 0.5 0.5
9+
python ./examples/minicpmv/minicpmv-convert-image-encoder-to-gguf.py -m ../MiniCPM-V-2_5 --minicpmv-projector ../MiniCPM-V-2_5/minicpmv.projector --output-dir ../MiniCPM-V-2_5/ --image-mean 0.5 0.5 0.5 --image-std 0.5 0.5 0.5
1010
python ./convert.py ../MiniCPM-V-2_5/model --outtype f16 --vocab-type bpe
11-
./minicpmv-cli -m ../MiniCPM-V-2_5/model/ggml-model-f16.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.7 --top-p 0.8 --top-k 100 --repeat-penalty 1.05 --image xx.jpg -p "What is in the image?"
11+
./minicpmv-cli -m ../MiniCPM-V-2_5/model/model-8B-F16.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.7 --top-p 0.8 --top-k 100 --repeat-penalty 1.05 --image xx.jpg -p "What is in the image?"
1212

1313
# or run quantize int4 version
14-
./quantize ../MiniCPM-V-2_5/model/ggml-model-f16.gguf ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf Q4_K_M
15-
./minicpmv-cli -m ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.6 --top-p 0.8 --top-k 100 --repeat-penalty 1.0 --image xx.jpg -p "What is in the image?"
14+
./quantize ../MiniCPM-V-2_5/model/model-8B-F16.gguf ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf Q4_K_M
15+
./minicpmv-cli -m ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.7 --top-p 0.8 --top-k 100 --repeat-penalty 1.05 --image xx.jpg -p "What is in the image?"
1616

1717
# or run in interactive mode
18-
./minicpmv-cli -m ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.6 --top-p 0.8 --top-k 100 --repeat-penalty 1.0 --image xx.jpg -i
18+
./minicpmv-cli -m ../MiniCPM-V-2_5/model/ggml-model-Q4_K_M.gguf --mmproj ../MiniCPM-V-2_5/mmproj-model-f16.gguf -c 4096 --temp 0.7 --top-p 0.8 --top-k 100 --repeat-penalty 1.05 --image xx.jpg -i
1919
```

examples/minicpmv/clip.cpp

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,7 @@ static std::string format(const char * fmt, ...) {
7575
#define KEY_DESCRIPTION "general.description"
7676
#define KEY_HAS_TEXT_ENC "clip.has_text_encoder"
7777
#define KEY_HAS_VIS_ENC "clip.has_vision_encoder"
78-
#define KEY_HAS_LLAVA_PROJ "clip.has_llava_projector"
78+
#define KEY_HAS_LLAVA_PROJ "clip.has_minicpmv_projector"
7979
#define KEY_USE_GELU "clip.use_gelu"
8080
#define KEY_N_EMBD "clip.%s.embedding_length"
8181
#define KEY_N_FF "clip.%s.feed_forward_length"
@@ -526,7 +526,7 @@ struct clip_vision_model {
526526
struct clip_ctx {
527527
bool has_text_encoder = false;
528528
bool has_vision_encoder = false;
529-
bool has_llava_projector = false;
529+
bool has_minicpmv_projector = false;
530530

531531
struct clip_vision_model vision_model;
532532
projector_type proj_type = PROJECTOR_TYPE_MLP;
@@ -606,7 +606,7 @@ static ggml_cgraph * clip_image_build_graph(clip_ctx * ctx, const clip_image_f32
606606

607607
const int batch_size = imgs->size;
608608

609-
if (ctx->has_llava_projector) {
609+
if (ctx->has_minicpmv_projector) {
610610
GGML_ASSERT(batch_size == 1);
611611
}
612612

@@ -1124,10 +1124,10 @@ struct clip_ctx * clip_model_load(const char * fname, const int verbosity = 1, s
11241124

11251125
idx = gguf_find_key(ctx, KEY_HAS_LLAVA_PROJ);
11261126
if (idx != -1) {
1127-
new_clip->has_llava_projector = gguf_get_val_bool(ctx, idx);
1127+
new_clip->has_minicpmv_projector = gguf_get_val_bool(ctx, idx);
11281128
}
11291129

1130-
GGML_ASSERT(new_clip->has_llava_projector); // see monatis/clip.cpp for image and/or text encoding for semantic search
1130+
GGML_ASSERT(new_clip->has_minicpmv_projector); // see monatis/clip.cpp for image and/or text encoding for semantic search
11311131
GGML_ASSERT(new_clip->has_vision_encoder);
11321132
GGML_ASSERT(!new_clip->has_text_encoder);
11331133

@@ -1137,7 +1137,7 @@ struct clip_ctx * clip_model_load(const char * fname, const int verbosity = 1, s
11371137
if (verbosity >= 1) {
11381138
LOG_TEE("%s: text_encoder: %d\n", __func__, new_clip->has_text_encoder);
11391139
LOG_TEE("%s: vision_encoder: %d\n", __func__, new_clip->has_vision_encoder);
1140-
LOG_TEE("%s: llava_projector: %d\n", __func__, new_clip->has_llava_projector);
1140+
LOG_TEE("%s: llava_projector: %d\n", __func__, new_clip->has_minicpmv_projector);
11411141
LOG_TEE("%s: model size: %.2f MB\n", __func__, model_size / 1024.0 / 1024.0);
11421142
LOG_TEE("%s: metadata size: %.2f MB\n", __func__, ggml_get_mem_size(meta) / 1024.0 / 1024.0);
11431143
}
@@ -1939,7 +1939,7 @@ bool clip_image_batch_encode(clip_ctx * ctx, const int n_threads, const clip_ima
19391939
}
19401940

19411941
int batch_size = imgs->size;
1942-
if (ctx->has_llava_projector) {
1942+
if (ctx->has_minicpmv_projector) {
19431943
GGML_ASSERT(batch_size == 1); // TODO: support multiple images
19441944
}
19451945

0 commit comments

Comments
 (0)