@@ -612,9 +612,9 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
612
612
while (request_queue_.read (request)) {
613
613
CHECK (request);
614
614
615
- if (request->offline ()) {
616
- DLOG << " Read an offline request from request_queue_" ;
617
- }
615
+ // if (request->offline()) {
616
+ // DVLOG << "Read an offline request from request_queue_";
617
+ // }
618
618
619
619
// expand sequences to the target number if prefix cache is disabled.
620
620
if (!enable_prefix_cache_) {
@@ -625,10 +625,12 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
625
625
if (request->sequences ()[0 ]->kv_state ().kv_cache_tokens_num () == 0 ) {
626
626
if (request->offline ()) {
627
627
waiting_priority_queue_offline_.push (request);
628
- DLOG << " Put an offline request into waiting_priority_queue_offline_" ;
628
+ // DVLOG << "Put an offline request into
629
+ // waiting_priority_queue_offline_";
629
630
} else {
630
631
waiting_priority_queue_.push (request);
631
- DLOG << " Put an online request into waiting_priority_queue_offline_" ;
632
+ // DVLOG << "Put an online request into
633
+ // waiting_priority_queue_offline_";
632
634
}
633
635
} else {
634
636
// request from prefill instance in disagge pd mode.
@@ -646,7 +648,7 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
646
648
std::shared_ptr<Request> request = *it;
647
649
request->update_connection_status ();
648
650
if (request->finished () || request->cancelled ()) {
649
- DLOG << " Found a finished request in running_requests_" ;
651
+ // DVLOG << "Found a finished request in running_requests_";
650
652
block_manager_pool_->deallocate (request.get ());
651
653
// release the ownership of the request
652
654
finished_requests.emplace_back (request);
@@ -671,10 +673,10 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
671
673
handle_running_requests (*it);
672
674
if ((*it)->offline ()) {
673
675
running_queue_offline_->push (*it, last_step_prefill_);
674
- DLOG << " Put an offline request into running_queue_offline_" ;
676
+ // DVLOG << "Put an offline request into running_queue_offline_";
675
677
} else {
676
678
running_queue_->push (*it, last_step_prefill_);
677
- DLOG << " Put an online request into running_queue_" ;
679
+ // DVLOG << "Put an online request into running_queue_";
678
680
}
679
681
}
680
682
} else {
@@ -697,16 +699,17 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
697
699
handle_running_requests (*it);
698
700
if ((*it)->offline ()) {
699
701
running_queue_offline_->push (*it, last_step_prefill_);
700
- DLOG << " Pushed an offline request into running_queue_offline_" ;
702
+ // DVLOG << "Pushed an offline request into running_queue_offline_";
701
703
} else {
702
704
running_queue_->push (*it, last_step_prefill_);
703
- DLOG << " Pushed an online request into running_queue_" ;
705
+ // DVLOG << "Pushed an online request into running_queue_";
704
706
}
705
707
}
706
708
}
707
709
} else {
708
- DLOG << " Using unknown priority_strategy: " << options_.priority_strategy ();
709
- // directly push running requests to the priority queue
710
+ // DVLOG << "Using unknown priority_strategy: " <<
711
+ // options_.priority_strategy(); directly push running requests to the
712
+ // priority queue
710
713
for (auto it = running_requests_.begin (); it != running_requests_.end ();
711
714
++it) {
712
715
if (*it == nullptr ) {
@@ -715,10 +718,10 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
715
718
handle_running_requests (*it);
716
719
if ((*it)->offline ()) {
717
720
running_queue_offline_->push (*it);
718
- DLOG << " Pushed an offline request into running_queue_offline_" ;
721
+ // DVLOG << "Pushed an offline request into running_queue_offline_";
719
722
} else {
720
723
running_queue_->push (*it);
721
- DLOG << " Pushed an online request into running_queue_" ;
724
+ // DVLOG << "Pushed an online request into running_queue_";
722
725
}
723
726
}
724
727
}
@@ -827,7 +830,7 @@ std::vector<Batch> ContinuousScheduler::prepare_batch() {
827
830
GAUGE_SET (num_free_blocks, util::max (block_manager_pool_->num_free_blocks ()));
828
831
GAUGE_SET (num_used_blocks, util::min (block_manager_pool_->num_used_blocks ()));
829
832
if (!batches[0 ].empty ()) {
830
- DLOG << " Built a batch" ;
833
+ DVLOG << " Built a batch" ;
831
834
}
832
835
return batches;
833
836
}
0 commit comments