EeyoreLee · EeyoreLee · Oct 12, 2024 · Oct 12, 2024
diff --git a/src/bert.cpp b/src/bert.cpp
@@ -64,6 +64,8 @@ void bert_batch_tokens::init_input_ids(std::vector<std::vector<int>> &input_ids,
 {
     static std::vector<bert_vocab_id> flat{};
     static std::vector<int32_t> mask{};
+    flat.clear();
+    mask.clear();
     for (const auto &ids : input_ids)
     {
         flat.insert(flat.end(), ids.begin(), ids.end());

diff --git a/test/test_batch_inference.cpp b/test/test_batch_inference.cpp
@@ -7,7 +7,7 @@
 int main(int argc, char **argv)
 {
     const std::string path = "/media/E/lichunyu/bert.cpp/data/test_tokenizer/tokenizer.json";
-    const std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.gguf";
+    const std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.ggml";
     const std::string text1 = "卫生间抽纸";
     const std::string text2 = "卫生间抽纸";
     const std::string text3 = "卫生间抽纸";

diff --git a/test/test_inference.cpp b/test/test_inference.cpp
@@ -7,7 +7,7 @@
 int main(int argc, char **argv)
 {
     const std::string path = "/media/E/lichunyu/bert.cpp/data/test_tokenizer/tokenizer.json";
-    const std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.gguf";
+    const std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.ggml";
     auto start_cpp_total = std::chrono::high_resolution_clock::now();
     bert_ctx *ctx = new bert_ctx();
     bert_model_load_from_ggml(fname, ctx->model);

diff --git a/test/test_model_load.cpp b/test/test_model_load.cpp
@@ -5,7 +5,7 @@
 int main(int argc, char **argv)
 {
     bert_model model;
-    std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.gguf";
+    std::string fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.ggml";
     if (!bert_model_load_from_ggml(fname, model))
     {
         fprintf(stderr, "%s: failed to load model from %s", __func__, fname.c_str());

diff --git a/test/test_py_entrance.cpp b/test/test_py_entrance.cpp
@@ -2,7 +2,7 @@
 
 int main(int argc, char **argv)
 {
-    const char *fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.gguf";
+    const char *fname = "/media/E/lichunyu/bert.cpp/data/ggml-model/ggml_model.ggml";
     const char *tokenizer_json_fname = "/media/E/lichunyu/bert.cpp/data/test_tokenizer/tokenizer.json";
     int32_t buf_compute = 320;
     bert_ctx *ctx = py_bert_ctx_load_from_file(fname, tokenizer_json_fname, buf_compute);