mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
MODEL_ID propagation fix
This commit is contained in:
parent
a895029424
commit
02b0eaaba0
@@ -46,6 +46,7 @@ from text_generation_server.models.globals import (
|
||||
get_adapter_to_index,
|
||||
MODEL_ID,
|
||||
)
|
||||
+import text_generation_server.models.globals as globals_vars
|
||||
from text_generation_server.layers.attention import Seqlen
|
||||
from text_generation_server.utils import StoppingCriteria, HeterogeneousNextTokenChooser
|
||||
from text_generation_server.utils.dist import MEMORY_FRACTION
|
||||
@@ -1157,7 +1158,7 @@ class FlashCausalLM(Model):
|
||||
|
||||
tunableop_filepath = os.path.join(
|
||||
HUGGINGFACE_HUB_CACHE,
|
||||
-f"tunableop_{MODEL_ID.replace('/', '-')}_tp{self.world_size}_rank{self.rank}.csv",
|
||||
+f"tunableop_{globals_vars.MODEL_ID.replace('/', '-')}_tp{self.world_size}_rank{self.rank}.csv",
|
||||
)
|
||||
|
||||
log_master(
|
||||
|
Loading…
Reference in New Issue
Block a user