mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
add log
This commit is contained in:
parent
8260dc00d8
commit
ca20c304b3
@ -779,6 +779,7 @@ class FlashCausalLM(Model):
|
|||||||
|
|
||||||
if os.getenv("ENABLE_CUDA_GRAPHS", "False") == "True":
|
if os.getenv("ENABLE_CUDA_GRAPHS", "False") == "True":
|
||||||
try:
|
try:
|
||||||
|
logger.info("Experimental support for Cuda Graphs is enabled")
|
||||||
# Warmup cuda graphs for all power of twos until 64
|
# Warmup cuda graphs for all power of twos until 64
|
||||||
for i in range(6):
|
for i in range(6):
|
||||||
self.cuda_graph_warmup(2**i, max_s, max_bt)
|
self.cuda_graph_warmup(2**i, max_s, max_bt)
|
||||||
|
Loading…
Reference in New Issue
Block a user