]> git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
llama : std::move llm_bigram_bpe from work_queue (#9062)
authorDaniel Bevenius <redacted>
Wed, 21 Aug 2024 07:32:58 +0000 (09:32 +0200)
committerGitHub <redacted>
Wed, 21 Aug 2024 07:32:58 +0000 (10:32 +0300)
* llama : std::move llm_bigram_bpe from work_queue

This commit changes how llm_bigram_bpe objects are retrieved from
work_queue: instead of copying the result of top(), the element is
moved out with std::move.

The motivation for this is to avoid the copying of the std::string
`text` member of the llm_bigram_bpe struct.

* squash! llama : std::move llm_bigram_bpe from work_queue

Introduced a MovablePriorityQueue class to allow moving elements
out of the priority queue for llm_bigram_bpe.

* squash! llama : std::move llm_bigram_bpe from work_queue

Rename MovablePriorityQueue to lama_priority_queue.

* squash! llama : std::move llm_bigram_bpe from work_queue

Rename lama_priority_queue -> llama_priority_queue.

src/llama-vocab.cpp

index 17deefaa860381d64221f04043499d7312d56e30..323660ef54cb07a7c90f15d86620583375754fc3 100644 (file)
@@ -321,6 +321,21 @@ private:
 
 // TODO: there are a lot of common parts between spm and bpe tokenizers, should be refactored and reused
 
// A std::priority_queue that additionally supports moving the top element out.
//
// std::priority_queue::top() returns a const reference, so callers are forced
// to copy the element before pop(); for llm_bigram_bpe that copies the
// std::string `text` member on every iteration of the merge loop. pop_move()
// avoids the copy by moving directly out of the underlying heap container
// (the protected member `c`) before re-heapifying.
template<typename T, typename Container = std::vector<T>, typename Compare = std::less<typename Container::value_type>>
class llama_priority_queue : public std::priority_queue<T, Container, Compare> {
public:
    using std::priority_queue<T, Container, Compare>::priority_queue;

    // Remove and return the highest-priority element by moving it out.
    // Precondition: the queue must not be empty (same precondition as
    // std::priority_queue::pop()).
    T pop_move() {
        T item = std::move(this->c.front());
        std::pop_heap(this->c.begin(), this->c.end(), this->comp);
        this->c.pop_back();
        return item;
    }

    // Hide the base-class pop() so callers cannot accidentally discard an
    // element without moving it; use pop_move() instead.
    void pop() = delete;
};
+
 struct llm_bigram_bpe {
     struct comparator {
         bool operator()(const llm_bigram_bpe & l, const llm_bigram_bpe & r) const {
@@ -329,7 +344,7 @@ struct llm_bigram_bpe {
     };
 
     using queue_storage = std::vector<llm_bigram_bpe>;
-    using queue = std::priority_queue<llm_bigram_bpe, queue_storage, comparator>;
+    using queue = llama_priority_queue<llm_bigram_bpe, queue_storage, comparator>;
     llm_symbol::index left;
     llm_symbol::index right;
     std::string text;
@@ -520,8 +535,7 @@ struct llm_tokenizer_bpe {
 
             // build token(s)
             while (!work_queue.empty()) {
-                auto bigram = work_queue.top();
-                work_queue.pop();
+                auto bigram = work_queue.pop_move();
 
                 auto & left_symbol = symbols[bigram.left];
                 auto & right_symbol = symbols[bigram.right];