Unverified commit e03ddcfb, authored by Akash kaothalkar, committed by GitHub
Browse files

[Hardware][Powerpc]Enable prefix caching and chunked prefill for ppc64le (#35081)


Signed-off-by: Akash kaothalkar <akash.kaothalkar@ibm.com>
Co-authored-by: Akash kaothalkar <akash.kaothalkar@ibm.com>
parent 02acd168
...@@ -2076,20 +2076,19 @@ class EngineArgs: ...@@ -2076,20 +2076,19 @@ class EngineArgs:
) )
# Disable chunked prefill and prefix caching for: # Disable chunked prefill and prefix caching for:
# POWER (ppc64le)/RISCV CPUs in V1 # RISCV CPUs in V1
if current_platform.is_cpu() and current_platform.get_cpu_architecture() in ( if current_platform.is_cpu() and current_platform.get_cpu_architecture() in (
CpuArchEnum.POWERPC,
CpuArchEnum.RISCV, CpuArchEnum.RISCV,
): ):
logger.info( logger.info(
"Chunked prefill is not supported for POWER, " "Chunked prefill is not supported for "
"and RISC-V CPUs; " "RISC-V CPUs; "
"disabling it for V1 backend." "disabling it for V1 backend."
) )
self.enable_chunked_prefill = False self.enable_chunked_prefill = False
logger.info( logger.info(
"Prefix caching is not supported for POWER, " "Prefix caching is not supported for "
"and RISC-V CPUs; " "RISC-V CPUs; "
"disabling it for V1 backend." "disabling it for V1 backend."
) )
self.enable_prefix_caching = False self.enable_prefix_caching = False
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment