Fix typo: rename parameter `deocder_output` to `decoder_output` in `LlamaV2::contextDecode` (#769)

2f80c556 · q.yao · GitHub · 7868cea5 · 2f80c556 · 2f80c556
Unverified Commit 2f80c556 authored Nov 28, 2023 by q.yao Committed by GitHub Nov 28, 2023
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 3 deletions

src/turbomind/models/llama/LlamaV2.cc +2 -2

src/turbomind/models/llama/LlamaV2.h +1 -1

No files found.
--- a/src/turbomind/models/llama/LlamaV2.cc
+++ b/src/turbomind/models/llama/LlamaV2.cc
@@ -218,7 +218,7 @@ void LlamaV2<T>::embeddingLookup(T* embeddings, const int* token_ids_buf, int ba
 }

 template<typename T>
-void LlamaV2<T>::contextDecode(T*           deocder_output,
+void LlamaV2<T>::contextDecode(T*           decoder_output,
                               uintptr_t*   k_cache_ptr,
                               uintptr_t*   v_cache_ptr,
                               void**       tmp_k_ptrs,
@@ -280,7 +280,7 @@ void LlamaV2<T>::contextDecode(T*           deocder_output,
        {"value_cache", {MEMORY_GPU, TYPE_UINT64, {bsz}, v_cache_ptr}},
        {"tmp_k", {MEMORY_GPU, TYPE_UINT64, {bsz}, tmp_k_ptrs}},
        {"tmp_v", {MEMORY_GPU, TYPE_UINT64, {bsz}, tmp_v_ptrs}},
-        {"last_token_hidden_units", {MEMORY_GPU, dtype, {bsz, hidden_units_}, deocder_output}}};
+        {"last_token_hidden_units", {MEMORY_GPU, dtype, {bsz, hidden_units_}, decoder_output}}};

    context_decoder_->forward(&decoder_output_tensors, &decoder_input_tensors, &weights_->decoder_layer_weights);


--- a/src/turbomind/models/llama/LlamaV2.h
+++ b/src/turbomind/models/llama/LlamaV2.h
@@ -113,7 +113,7 @@ private:

    void embeddingLookup(T* embeddings, const int* token_ids_buf, int batch_size, int step);

-    void contextDecode(T*           deocder_output,
+    void contextDecode(T*           decoder_output,
                       uintptr_t*   k_block_ptrs,
                       uintptr_t*   v_block_ptrs,
                       void**       k_tmp_ptrs,