fix(memory): correctly recommend instance types for cloud

Signed-off-by: paperspace <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
paperspace
2024-05-23 14:42:39 +00:00
parent db523e2940
commit cec0aa5487
3 changed files with 25 additions and 8 deletions

View File

@@ -436,7 +436,7 @@ def build_command(
service_config = dict(
resources={
'gpu' if device else 'cpu': len(device) if device else '1',
-'gpu_type': recommended_instance_type(model_id, bentomodel),
+'gpu_type': recommended_instance_type(model_id, bentomodel, serialisation),
},
traffic=dict(timeout=timeout),
)