Optimize CUDA execution to run in a single stream

This commit is contained in:
Nicolas Mowen 2025-09-03 07:31:38 -06:00
parent bd255362d6
commit c308d14587

View File

@@ -306,6 +306,7 @@ def get_ort_providers(
options.append(
{
"arena_extend_strategy": "kSameAsRequested",
"use_ep_level_unified_stream": True,
"device_id": device_id,
}
)