mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-05-03 13:22:43 -04:00
fix(gpus): disable slots for now to enable cached_property
Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
@@ -45,7 +45,7 @@ _AdapterTuple: type[AdapterTuple] = codegen.make_attr_tuple_class('AdapterTuple'
 ResolvedAdapterMap = t.Dict[AdapterType, t.Dict[str, t.Tuple['PeftConfig', str]]]
 
 
-@attr.define(slots=True, repr=False, init=False)
+@attr.define(slots=False, repr=False, init=False)
 class LLM(t.Generic[M, T]):
   async def generate(
     self, prompt, prompt_token_ids=None, stop=None, stop_token_ids=None, request_id=None, adapter_name=None, **attrs
||||
Reference in New Issue
Block a user