Skip to content

Commit 636d3cb

Browse files
authored
refactor: reorganize the vocab file structure (#1271)
1 parent adea272 commit 636d3cb

File tree

14 files changed

+67
-55
lines changed

14 files changed

+67
-55
lines changed

CMakeLists.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -90,6 +90,8 @@ file(GLOB SD_LIB_SOURCES
9090
"src/*.h"
9191
"src/*.cpp"
9292
"src/*.hpp"
93+
"src/vocab/*.h"
94+
"src/vocab/*.cpp"
9395
)
9496

9597
find_program(GIT_EXE NAMES git git.exe NO_CMAKE_FIND_ROOT_PATH)

format-code.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
for f in *.cpp *.h *.hpp examples/cli/*.cpp examples/common/*.hpp examples/cli/*.h examples/server/*.cpp; do
1+
for f in src/*.cpp src/*.h src/*.hpp src/vocab/*.h src/vocab/*.cpp examples/cli/*.cpp examples/common/*.hpp examples/cli/*.h examples/server/*.cpp; do
22
[[ "$f" == vocab* ]] && continue
33
echo "formatting '$f'"
44
# if [ "$f" != "stable-diffusion.h" ]; then

src/clip.hpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@
44
#include "ggml_extend.hpp"
55
#include "model.h"
66
#include "tokenize_util.h"
7+
#include "vocab/vocab.h"
78

89
/*================================================== CLIPTokenizer ===================================================*/
910

@@ -110,7 +111,7 @@ class CLIPTokenizer {
110111
if (merges_utf8_str.size() > 0) {
111112
load_from_merges(merges_utf8_str);
112113
} else {
113-
load_from_merges(ModelLoader::load_merges());
114+
load_from_merges(load_clip_merges());
114115
}
115116
add_special_token("<|startoftext|>");
116117
add_special_token("<|endoftext|>");

src/llm.hpp

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919
#include "json.hpp"
2020
#include "rope.hpp"
2121
#include "tokenize_util.h"
22+
#include "vocab/vocab.h"
2223

2324
namespace LLM {
2425
constexpr int LLM_GRAPH_SIZE = 10240;
@@ -365,7 +366,7 @@ namespace LLM {
365366
if (merges_utf8_str.size() > 0) {
366367
load_from_merges(merges_utf8_str);
367368
} else {
368-
load_from_merges(ModelLoader::load_qwen2_merges());
369+
load_from_merges(load_qwen2_merges());
369370
}
370371
}
371372
};
@@ -466,7 +467,7 @@ namespace LLM {
466467
if (merges_utf8_str.size() > 0 && vocab_utf8_str.size() > 0) {
467468
load_from_merges(merges_utf8_str, vocab_utf8_str);
468469
} else {
469-
load_from_merges(ModelLoader::load_mistral_merges(), ModelLoader::load_mistral_vocab_json());
470+
load_from_merges(load_mistral_merges(), load_mistral_vocab_json());
470471
}
471472
}
472473
};

src/model.cpp

Lines changed: 0 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -16,10 +16,6 @@
1616
#include "model.h"
1717
#include "stable-diffusion.h"
1818
#include "util.h"
19-
#include "vocab.hpp"
20-
#include "vocab_mistral.hpp"
21-
#include "vocab_qwen.hpp"
22-
#include "vocab_umt5.hpp"
2319

2420
#include "ggml-alloc.h"
2521
#include "ggml-backend.h"
@@ -1340,36 +1336,6 @@ void ModelLoader::set_wtype_override(ggml_type wtype, std::string tensor_type_ru
13401336
}
13411337
}
13421338

1343-
std::string ModelLoader::load_merges() {
1344-
std::string merges_utf8_str(reinterpret_cast<const char*>(merges_utf8_c_str), sizeof(merges_utf8_c_str));
1345-
return merges_utf8_str;
1346-
}
1347-
1348-
std::string ModelLoader::load_qwen2_merges() {
1349-
std::string merges_utf8_str(reinterpret_cast<const char*>(qwen2_merges_utf8_c_str), sizeof(qwen2_merges_utf8_c_str));
1350-
return merges_utf8_str;
1351-
}
1352-
1353-
std::string ModelLoader::load_mistral_merges() {
1354-
std::string merges_utf8_str(reinterpret_cast<const char*>(mistral_merges_utf8_c_str), sizeof(mistral_merges_utf8_c_str));
1355-
return merges_utf8_str;
1356-
}
1357-
1358-
std::string ModelLoader::load_mistral_vocab_json() {
1359-
std::string json_str(reinterpret_cast<const char*>(mistral_vocab_json_utf8_c_str), sizeof(mistral_vocab_json_utf8_c_str));
1360-
return json_str;
1361-
}
1362-
1363-
std::string ModelLoader::load_t5_tokenizer_json() {
1364-
std::string json_str(reinterpret_cast<const char*>(t5_tokenizer_json_str), sizeof(t5_tokenizer_json_str));
1365-
return json_str;
1366-
}
1367-
1368-
std::string ModelLoader::load_umt5_tokenizer_json() {
1369-
std::string json_str(reinterpret_cast<const char*>(umt5_tokenizer_json_str), sizeof(umt5_tokenizer_json_str));
1370-
return json_str;
1371-
}
1372-
13731339
bool ModelLoader::load_tensors(on_new_tensor_cb_t on_new_tensor_cb, int n_threads_p, bool enable_mmap) {
13741340
int64_t process_time_ms = 0;
13751341
std::atomic<int64_t> read_time_ms(0);

src/model.h

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -331,13 +331,6 @@ class ModelLoader {
331331
bool tensor_should_be_converted(const TensorStorage& tensor_storage, ggml_type type);
332332
int64_t get_params_mem_size(ggml_backend_t backend, ggml_type type = GGML_TYPE_COUNT);
333333
~ModelLoader() = default;
334-
335-
static std::string load_merges();
336-
static std::string load_qwen2_merges();
337-
static std::string load_mistral_merges();
338-
static std::string load_mistral_vocab_json();
339-
static std::string load_t5_tokenizer_json();
340-
static std::string load_umt5_tokenizer_json();
341334
};
342335

343336
#endif // __MODEL_H__

src/stable-diffusion.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2679,7 +2679,7 @@ class StableDiffusionGGML {
26792679
};
26802680
sd_tiling_non_square(x, result, vae_scale_factor, tile_size_x, tile_size_y, tile_overlap, on_tiling);
26812681
} else {
2682-
if(!first_stage_model->compute(n_threads, x, true, &result, work_ctx)){
2682+
if (!first_stage_model->compute(n_threads, x, true, &result, work_ctx)) {
26832683
LOG_ERROR("Failed to decode latents");
26842684
first_stage_model->free_compute_buffer();
26852685
return nullptr;
@@ -2695,7 +2695,7 @@ class StableDiffusionGGML {
26952695
};
26962696
sd_tiling(x, result, vae_scale_factor, 64, 0.5f, on_tiling);
26972697
} else {
2698-
if(!tae_first_stage->compute(n_threads, x, true, &result)){
2698+
if (!tae_first_stage->compute(n_threads, x, true, &result)) {
26992699
LOG_ERROR("Failed to decode latents");
27002700
tae_first_stage->free_compute_buffer();
27012701
return nullptr;

src/t5.hpp

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414
#include "ggml_extend.hpp"
1515
#include "json.hpp"
1616
#include "model.h"
17+
#include "vocab/vocab.h"
1718

1819
// Port from: https://github.com/google/sentencepiece/blob/master/src/unigram_model.h
1920
// and https://github.com/google/sentencepiece/blob/master/src/unigram_model.h.
@@ -341,9 +342,9 @@ class T5UniGramTokenizer {
341342
public:
342343
explicit T5UniGramTokenizer(bool is_umt5 = false) {
343344
if (is_umt5) {
344-
InitializePieces(ModelLoader::load_umt5_tokenizer_json());
345+
InitializePieces(load_umt5_tokenizer_json());
345346
} else {
346-
InitializePieces(ModelLoader::load_t5_tokenizer_json());
347+
InitializePieces(load_t5_tokenizer_json());
347348
}
348349

349350
min_score_ = FLT_MAX;

0 commit comments

Comments
 (0)