Commit 2cec992f authored by zhouxiang's avatar zhouxiang
Browse files

修复batch推理bug (Fix batch-inference bug: pass the array length `query_size` to `freeCharArray` when releasing the batched output buffers)

parent 15d855b9
......@@ -483,7 +483,7 @@ class model:
response = ctypes.string_at(outputs[i]).decode()
responses.append(response)
historys[i] = historys[i] + [(querys[i], response)]
fastllm_lib.freeCharArray(outputs)
fastllm_lib.freeCharArray(outputs, query_size)
return responses, historys
def chat_batch(self, tokenizer, querys: List[str], historys: List[List[Tuple[str, str]]] = None, max_length: int = 1024,
......@@ -511,7 +511,7 @@ class model:
response = ctypes.string_at(outputs[i]).decode()
responses.append(response)
historys[i] = historys[i] + [(querys[i], response)]
fastllm_lib.freeCharArray(outputs)
fastllm_lib.freeCharArray(outputs, query_size)
return responses, historys
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment