@@ -49,6 +49,11 @@ std::vector<std::string> XllmRpcServiceImpl::get_static_decode_list(
4949 return scheduler_->get_static_decode_list (instance_name);
5050}
5151
52+ std::vector<std::string> XllmRpcServiceImpl::get_static_prefill_list (
53+ const std::string& instance_name) {
54+ return scheduler_->get_static_prefill_list (instance_name);
55+ }
56+
5257bool XllmRpcServiceImpl::handle_generation (
5358 const llm::RequestOutput& request_output) {
5459 return scheduler_->handle_generation (request_output);
@@ -126,6 +131,19 @@ void XllmRpcService::GetStaticDecodeList(
126131 }
127132}
128133
134+ void XllmRpcService::GetStaticPrefillList (
135+ google::protobuf::RpcController* cntl_base,
136+ const proto::InstanceID* req,
137+ proto::InstanceIDs* resp,
138+ google::protobuf::Closure* done) {
139+ brpc::ClosureGuard done_guard (done);
140+ std::vector<std::string> prefill_list =
141+ xllm_rpc_service_impl_->get_static_prefill_list (req->name ());
142+ for (auto & p : prefill_list) {
143+ *(resp->mutable_names ()->Add ()) = std::move (p);
144+ }
145+ }
146+
129147void XllmRpcService::Generations (google::protobuf::RpcController* cntl_base,
130148 const proto::DisaggStreamGenerations* req,
131149 proto::StatusSet* resp,
0 commit comments