@@ -142,6 +142,7 @@ def __init__(
142
142
143
143
self .gpu_id = gpu_id
144
144
self .cache_info = dict ()
145
+ self .dp_rank_id = local_data_parallel_id
145
146
146
147
layerwise_send_cache_thread = threading .Thread (target = self ._prefill_layerwise_send_cache_thread )
147
148
layerwise_send_cache_thread .daemon = True
@@ -159,29 +160,29 @@ def _prefill_layerwise_send_cache_thread(self):
159
160
prefilled_layer_idx_data = np .zeros (shape = [1 ], dtype = np .int32 )
160
161
try :
161
162
step_shm_value = IPCSignal (
162
- name = f"splitwise_complete_prefilled_step_{ self .rank } " ,
163
+ name = f"splitwise_complete_prefilled_step_{ self .dp_rank_id } " ,
163
164
array = prefilled_step_idx_data ,
164
165
dtype = np .int32 ,
165
166
suffix = self .gpu_id ,
166
167
create = True ,
167
168
)
168
169
layer_shm_value = IPCSignal (
169
- name = f"splitwise_complete_prefilled_layer_{ self .rank } " ,
170
+ name = f"splitwise_complete_prefilled_layer_{ self .dp_rank_id } " ,
170
171
array = prefilled_layer_idx_data ,
171
172
dtype = np .int32 ,
172
173
suffix = self .gpu_id ,
173
174
create = True ,
174
175
)
175
176
except :
176
177
step_shm_value = IPCSignal (
177
- name = f"splitwise_complete_prefilled_step_{ self .rank } " ,
178
+ name = f"splitwise_complete_prefilled_step_{ self .dp_rank_id } " ,
178
179
array = prefilled_step_idx_data ,
179
180
dtype = np .int32 ,
180
181
suffix = self .gpu_id ,
181
182
create = False ,
182
183
)
183
184
layer_shm_value = IPCSignal (
184
- name = f"splitwise_complete_prefilled_layer_{ self .rank } " ,
185
+ name = f"splitwise_complete_prefilled_layer_{ self .dp_rank_id } " ,
185
186
array = prefilled_layer_idx_data ,
186
187
dtype = np .int32 ,
187
188
suffix = self .gpu_id ,
0 commit comments