Skip to content

Commit 9baa5a2

Browse files
Add option to allow resplitting for priority aware scheduler.
PiperOrigin-RevId: 897839389
1 parent 824ad7a commit 9baa5a2

2 files changed

Lines changed: 6 additions & 0 deletions

File tree

tensorflow_serving/servables/tensorflow/tfrt_saved_model_factory.cc

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -245,6 +245,8 @@ absl::StatusOr<tfrt::SavedModel::Options> CreateCommonSavedModelOptions(
245245
// Open Source TensorFlow r2.20 release.
246246
compile_options.enable_priority_aware_batch_scheduler =
247247
config.enable_priority_aware_batch_scheduler();
248+
compile_options.enable_priority_aware_batch_scheduler_resplit =
249+
config.enable_priority_aware_batch_scheduler_resplit();
248250
#endif
249251

250252
compile_options.batch_padding_policy = config.batch_padding_policy();

tensorflow_serving/servables/tensorflow/tfrt_saved_model_source_adapter.proto

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -257,6 +257,10 @@ message TfrtSavedModelConfig {
257257
// Requests with higher priority will be scheduled into batches before
258258
// lower priority requests.
259259
bool enable_priority_aware_batch_scheduler = 2033;
260+
261+
// If true, the priority aware batch scheduler will resplit tasks into
262+
// smaller batches if needed.
263+
bool enable_priority_aware_batch_scheduler_resplit = 2034;
260264
}
261265

262266
// Config proto for TfrtSavedModelSourceAdapter.

0 commit comments

Comments
 (0)