Skip to content

Commit fe17410

Browse files
[BUG] Fix bug for pd in fd (#3034)
* Fix bug for pd in fd

* Fix bug for pd in fd

---------

Co-authored-by: Jiang-Jia-Jun <163579578+Jiang-Jia-Jun@users.noreply.github.com>
1 parent 1a543bc commit fe17410

File tree

2 files changed

+6
-5
lines changed

2 files changed

+6
-5
lines changed

fastdeploy/cache_manager/cache_messager.py

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -142,6 +142,7 @@ def __init__(
142142

143143
self.gpu_id = gpu_id
144144
self.cache_info = dict()
145+
self.dp_rank_id = local_data_parallel_id
145146

146147
layerwise_send_cache_thread = threading.Thread(target=self._prefill_layerwise_send_cache_thread)
147148
layerwise_send_cache_thread.daemon = True
@@ -159,29 +160,29 @@ def _prefill_layerwise_send_cache_thread(self):
159160
prefilled_layer_idx_data = np.zeros(shape=[1], dtype=np.int32)
160161
try:
161162
step_shm_value = IPCSignal(
162-
name=f"splitwise_complete_prefilled_step_{self.rank}",
163+
name=f"splitwise_complete_prefilled_step_{self.dp_rank_id}",
163164
array=prefilled_step_idx_data,
164165
dtype=np.int32,
165166
suffix=self.gpu_id,
166167
create=True,
167168
)
168169
layer_shm_value = IPCSignal(
169-
name=f"splitwise_complete_prefilled_layer_{self.rank}",
170+
name=f"splitwise_complete_prefilled_layer_{self.dp_rank_id}",
170171
array=prefilled_layer_idx_data,
171172
dtype=np.int32,
172173
suffix=self.gpu_id,
173174
create=True,
174175
)
175176
except:
176177
step_shm_value = IPCSignal(
177-
name=f"splitwise_complete_prefilled_step_{self.rank}",
178+
name=f"splitwise_complete_prefilled_step_{self.dp_rank_id}",
178179
array=prefilled_step_idx_data,
179180
dtype=np.int32,
180181
suffix=self.gpu_id,
181182
create=False,
182183
)
183184
layer_shm_value = IPCSignal(
184-
name=f"splitwise_complete_prefilled_layer_{self.rank}",
185+
name=f"splitwise_complete_prefilled_layer_{self.dp_rank_id}",
185186
array=prefilled_layer_idx_data,
186187
dtype=np.int32,
187188
suffix=self.gpu_id,

fastdeploy/cache_manager/transfer_factory/rdma_cache_transfer.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ def __init__(
4545
return
4646
self.messager = rdma_comm.RDMACommunicator(
4747
splitwise_role,
48-
rank,
48+
gpu_id,
4949
str(rdma_port) if splitwise_role == "decode" else "0",
5050
cache_k_ptr_list,
5151
cache_v_ptr_list,

0 commit comments

Comments
 (0)