mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-02-08 06:42:20 -05:00
fix(memory): correctly recommend instance types for cloud
Signed-off-by: paperspace <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
@@ -436,7 +436,7 @@ def build_command(
|
||||
service_config = dict(
|
||||
resources={
|
||||
'gpu' if device else 'cpu': len(device) if device else '1',
|
||||
- 'gpu_type': recommended_instance_type(model_id, bentomodel),
|
||||
+ 'gpu_type': recommended_instance_type(model_id, bentomodel, serialisation),
|
||||
},
|
||||
traffic=dict(timeout=timeout),
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user