diff --git a/openllm-python/src/openllm/_llm.py b/openllm-python/src/openllm/_llm.py index d8457885..8bc35318 100644 --- a/openllm-python/src/openllm/_llm.py +++ b/openllm-python/src/openllm/_llm.py @@ -184,8 +184,8 @@ class LLM(t.Generic[M, T]): adapter_map=convert_peft_config_type(adapter_map) if adapter_map is not None else None, serialisation=serialisation, local=_local, - max_model_len=getenv('max_model_len', default=max_model_len), - gpu_memory_utilization=getenv('gpu_memory_utilization', default=gpu_memory_utilization), + max_model_len=max_model_len, + gpu_memory_utilization=gpu_memory_utilization, LLM__model_attrs=model_attrs, LLM__tokenizer_attrs=tokenizer_attrs, llm_dtype__=dtype.lower(),