You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
@@ -1785,9 +1787,9 @@ struct LLMEmbedder : public Conditioner {
1785
1787
prompt = "<|im_start|>system\nDescribe the key features of the input image (color, shape, size, texture, objects, background), then explain how the user's text instruction should alter or modify the image. Generate a new image that meets the user's requirements while maintaining consistency with the original input where appropriate.<|im_end|>\n<|im_start|>user\n";
@@ -1796,19 +1798,30 @@ struct LLMEmbedder : public Conditioner {
1796
1798
1797
1799
prompt = "[SYSTEM_PROMPT]You are an AI that reasons about image descriptions. You give structured responses focusing on object relationships, object\nattribution and actions without speculation.[/SYSTEM_PROMPT][INST]";
prompt = "<|im_start|>system\nDescribe the image by detailing the color, shape, size, texture, quantity, text, spatial relationships of the objects and background:<|im_end|>\n<|im_start|>user\n";
if (params.arch == LLMArch::MISTRAL_SMALL_3_2 || params.arch == LLMArch::QWEN3) {
1136
1166
input_pos_vec.resize(n_tokens);
1137
1167
for (int i = 0; i < n_tokens; ++i) {
1138
1168
input_pos_vec[i] = i;
@@ -1420,7 +1450,8 @@ namespace LLM {
1420
1450
1421
1451
struct ggml_context* work_ctx = ggml_init(params);
1422
1452
GGML_ASSERT(work_ctx != nullptr);
1423
-
bool test_mistral = true;
1453
+
bool test_mistral = false;
1454
+
bool test_qwen3 = true;
1424
1455
bool test_vit = false;
1425
1456
bool test_decoder_with_vit = false;
1426
1457
@@ -1455,9 +1486,9 @@ namespace LLM {
1455
1486
std::pair<int, int> prompt_attn_range;
1456
1487
std::string text = "<|im_start|>system\nDescribe the key features of the input image (color, shape, size, texture, objects, background), then explain how the user's text instruction should alter or modify the image. Generate a new image that meets the user's requirements while maintaining consistency with the original input where appropriate.<|im_end|>\n<|im_start|>user\n";
auto tokens_and_weights = tokenize(text, prompt_attn_range, 0, false);
@@ -1496,9 +1527,9 @@ namespace LLM {
1496
1527
} else if (test_mistral) {
1497
1528
std::pair<int, int> prompt_attn_range;
1498
1529
std::string text = "[SYSTEM_PROMPT]You are an AI that reasons about image descriptions. You give structured responses focusing on object relationships, object\nattribution and actions without speculation.[/SYSTEM_PROMPT][INST]";
std::string text = "<|im_start|>system\nDescribe the image by detailing the color, shape, size, texture, quantity, text, spatial relationships of the objects and background:<|im_end|>\n<|im_start|>user\n";
0 commit comments