@@ -34,6 +34,8 @@ limitations under the License.
3434
3535namespace xllm {
3636
37+ constexpr uint32_t COPY_BATCH_SIZE = 1 ;
38+
3739WorkerService::WorkerService (runtime::Options options,
3840 const torch::Device& device)
3941 : options_(options), device_(device), initialized_(false ) {
@@ -490,7 +492,7 @@ void WorkerService::PrefetchFromStorage(
490492 std::vector<BlockTransferInfo> block_transfer_info;
491493 proto_to_block_transfer_info (*req, block_transfer_info);
492494
493- copy_threadpool_ .schedule (
495+ BThreadPool::get_instance () .schedule (
494496 [this ,
495497 block_transfer_info = std::move (block_transfer_info),
496498 stream_id = std::move (stream_id),
@@ -499,15 +501,14 @@ void WorkerService::PrefetchFromStorage(
499501 auto close_future = stream_handler->get_close_future ();
500502 bool is_completed = false ;
501503
502- for (size_t i = 0 ; i < transfer_slice.size ();
503- i += stream_copy_batch_size_) {
504+ for (size_t i = 0 ; i < transfer_slice.size (); i += COPY_BATCH_SIZE) {
504505 auto current_slice = transfer_slice.slice (
505- i, std::min (i + stream_copy_batch_size_ , transfer_slice.size ()));
506+ i, std::min (i + COPY_BATCH_SIZE , transfer_slice.size ()));
506507
507508 auto success_cnt = worker_->prefetch_from_storage (current_slice);
508509
509510 if (success_cnt != current_slice.size () ||
510- i + stream_copy_batch_size_ >= transfer_slice.size ()) {
511+ i + COPY_BATCH_SIZE >= transfer_slice.size ()) {
511512 is_completed = true ;
512513 }
513514
0 commit comments