Skip to content

Commit 823f628

Browse files
authored
Enable parallel instance loading backend attribute (triton-inference-server#284)
1 parent d9de83e commit 823f628

File tree

1 file changed

+5
-0
lines changed

1 file changed

+5
-0
lines changed

src/python_be.cc

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2274,6 +2274,11 @@ TRITONBACKEND_GetBackendAttribute(
22742274
backend_attributes, TRITONSERVER_INSTANCEGROUPKIND_CPU, 0, nullptr, 0));
22752275
#endif
22762276

2277+
// This backend can safely handle parallel calls to
2278+
// TRITONBACKEND_ModelInstanceInitialize (thread-safe).
2279+
RETURN_IF_ERROR(TRITONBACKEND_BackendAttributeSetParallelModelInstanceLoading(
2280+
backend_attributes, true));
2281+
22772282
return nullptr;
22782283
}
22792284

0 commit comments

Comments
 (0)