@@ -73,12 +73,6 @@ class CachedRequestState:
7373 lora_request : Optional [LoRARequest ] = None
7474 prompt_embeds : Optional [torch .Tensor ] = None
7575
76- # pcp/dcp param
77- local_chunked_kv_lens : Optional [list [Optional [list [Optional [
78- list [int ]]]]]] = None # Records computed tokens for each chunk
79- next_pcp_dcp_start_rank : int = 0 # Tracks next starting rank for round-robin distribution
80- token_blank_in_last_blk : int = 0 # if the last block is not full, how many future tokens can be stored
81-
8276 def __post_init__ (self ):
8377 self .num_prompt_tokens = length_from_prompt_token_ids_or_embeds (
8478 self .prompt_token_ids , self .prompt_embeds )
@@ -319,10 +313,6 @@ def __init__(
319313 self .prev_sampled_token_ids_invalid_indices : Optional [set [int ]] = None
320314 self .prev_req_id_to_index : Optional [dict [str , int ]] = None
321315
322- # pcp/dcp parameters
323- self .local_chunked_kv_lens : list [Optional [list [Optional [list [Optional [
324- list [int ]]]]]]] = [None ] * max_num_reqs
325-
326316 @property
327317 def req_ids (self ) -> list [str ]:
328318 # None elements should only be present transiently
@@ -395,9 +385,6 @@ def add_request(
395385 self .num_computed_tokens_cpu [req_index ] = request .num_computed_tokens
396386 self .block_table .add_row (request .block_ids , req_index )
397387
398- # Add PCP/DCP tracking fields
399- self .local_chunked_kv_lens [req_index ] = request .local_chunked_kv_lens
400-
401388 if sampling_params := request .sampling_params :
402389 if (self .is_spec_decode
403390 and is_spec_decode_unsupported (sampling_params )):
@@ -693,8 +680,6 @@ def condense(self) -> None:
693680 last_req_index ]
694681 self .num_computed_tokens_cpu [
695682 empty_index ] = self .num_computed_tokens_cpu [last_req_index ]
696- self .local_chunked_kv_lens [
697- empty_index ] = self .local_chunked_kv_lens [last_req_index ]
698683 self .block_table .move_row (last_req_index , empty_index )
699684 self .temperature_cpu [empty_index ] = self .temperature_cpu [
700685 last_req_index ]
0 commit comments