Skip to content

Commit 96e8cbe

Browse files
committed
First step on fixing the BTL API conversion for the SMCUDA BTL
Signed-off-by: George Bosilca <bosilca@icl.utk.edu>
1 parent 1f237f5 commit 96e8cbe

File tree

4 files changed

+16
-25
lines changed

4 files changed

+16
-25
lines changed

ompi/mca/pml/ob1/pml_ob1_recvfrag.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -624,10 +624,10 @@ void mca_pml_ob1_recv_frag_callback_frag (mca_btl_base_module_t *btl,
624624
assert(btl->btl_flags & MCA_BTL_FLAGS_CUDA_COPY_ASYNC_RECV);
625625

626626
/* This will trigger the opal_convertor_pack to start asynchronous copy. */
627-
mca_pml_ob1_recv_request_frag_copy_start(recvreq,btl,segments,descriptor->des_segment_count,des);
627+
mca_pml_ob1_recv_request_frag_copy_start(recvreq, btl, segments, descriptor->des_segment_count, NULL);
628628

629629
/* Let BTL know that it CANNOT free the frag */
630-
descriptor->des_flags |= MCA_BTL_DES_FLAGS_CUDA_COPY_ASYNC;
630+
//TODO: GB: descriptor->des_flags |= MCA_BTL_DES_FLAGS_CUDA_COPY_ASYNC;
631631

632632
return;
633633
}

ompi/mca/pml/ob1/pml_ob1_recvreq.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -577,7 +577,7 @@ void mca_pml_ob1_recv_request_progress_frag( mca_pml_ob1_recv_request_t* recvreq
577577
*/
578578
void mca_pml_ob1_recv_request_frag_copy_start( mca_pml_ob1_recv_request_t* recvreq,
579579
mca_btl_base_module_t* btl,
580-
mca_btl_base_segment_t* segments,
580+
const mca_btl_base_segment_t* segments,
581581
size_t num_segments,
582582
mca_btl_base_descriptor_t* des)
583583
{

ompi/mca/pml/ob1/pml_ob1_recvreq.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -332,7 +332,7 @@ void mca_pml_ob1_recv_request_progress_frag(
332332
void mca_pml_ob1_recv_request_frag_copy_start(
333333
mca_pml_ob1_recv_request_t* req,
334334
struct mca_btl_base_module_t* btl,
335-
mca_btl_base_segment_t* segments,
335+
const mca_btl_base_segment_t* segments,
336336
size_t num_segments,
337337
mca_btl_base_descriptor_t* des);
338338

opal/mca/btl/smcuda/btl_smcuda_component.c

Lines changed: 12 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
* Copyright (c) 2004-2011 The Trustees of Indiana University and Indiana
44
* University Research and Technology
55
* Corporation. All rights reserved.
6-
* Copyright (c) 2004-2009 The University of Tennessee and The University
6+
* Copyright (c) 2004-2020 The University of Tennessee and The University
77
* of Tennessee Research Foundation. All rights
88
* reserved.
99
* Copyright (c) 2004-2005 High Performance Computing Center Stuttgart,
@@ -679,20 +679,15 @@ static void mca_btl_smcuda_send_cuda_ipc_ack(struct mca_btl_base_module_t* btl,
679679
* BTL. It handles smcuda specific control messages that are triggered
680680
* when GPU memory transfers are initiated. */
681681
static void btl_smcuda_control(mca_btl_base_module_t* btl,
682-
mca_btl_base_tag_t tag,
683-
mca_btl_base_descriptor_t* des, void* cbdata)
682+
const mca_btl_base_receive_descriptor_t *descriptor)
684683
{
685684
int mydevnum, ipcaccess, res;
686685
ctrlhdr_t ctrlhdr;
687686
opal_proc_t *ep_proc;
688-
struct mca_btl_base_endpoint_t *endpoint;
689687
mca_btl_smcuda_t *smcuda_btl = (mca_btl_smcuda_t *)btl;
690-
mca_btl_smcuda_frag_t *frag = (mca_btl_smcuda_frag_t *)des;
691-
mca_btl_base_segment_t* segments = des->des_segments;
688+
const mca_btl_base_segment_t* segments = descriptor->des_segments;
689+
struct mca_btl_base_endpoint_t *endpoint = descriptor->endpoint;
692690

693-
/* Use the rank of the peer that sent the data to get to the endpoint
694-
* structure. This is needed for PML callback. */
695-
endpoint = mca_btl_smcuda_component.sm_peers[frag->hdr->my_smp_rank];
696691
ep_proc = endpoint->proc_opal;
697692

698693
/* Copy out control message payload to examine it */
@@ -764,7 +759,6 @@ static void btl_smcuda_control(mca_btl_base_module_t* btl,
764759
}
765760
}
766761

767-
assert(endpoint->peer_smp_rank == frag->hdr->my_smp_rank);
768762
opal_output_verbose(10, mca_btl_smcuda_component.cuda_ipc_output,
769763
"Analyzed CUDA IPC request: myrank=%d, mydev=%d, peerrank=%d, "
770764
"peerdev=%d --> ACCESS=%d",
@@ -999,7 +993,6 @@ int mca_btl_smcuda_component_progress(void)
999993
/* local variables */
1000994
mca_btl_base_segment_t seg;
1001995
mca_btl_smcuda_frag_t *frag;
1002-
mca_btl_smcuda_frag_t Frag;
1003996
sm_fifo_t *fifo = NULL;
1004997
mca_btl_smcuda_hdr_t *hdr;
1005998
int my_smp_rank = mca_btl_smcuda_component.my_smp_rank;
@@ -1046,7 +1039,6 @@ int mca_btl_smcuda_component_progress(void)
10461039
switch(((uintptr_t)hdr) & MCA_BTL_SMCUDA_FRAG_TYPE_MASK) {
10471040
case MCA_BTL_SMCUDA_FRAG_SEND:
10481041
{
1049-
mca_btl_active_message_callback_t* reg;
10501042
/* change the address from address relative to the shared
10511043
* memory address, to a true virtual address */
10521044
hdr = (mca_btl_smcuda_hdr_t *) RELATIVE2VIRTUAL(hdr);
@@ -1058,17 +1050,16 @@ int mca_btl_smcuda_component_progress(void)
10581050
my_smp_rank, peer_smp_rank, j, FIFO_MAP(peer_smp_rank));
10591051
}
10601052
#endif
1061-
/* recv upcall */
1062-
reg = mca_btl_base_active_message_trigger + hdr->tag;
10631053
seg.seg_addr.pval = ((char *)hdr) + sizeof(mca_btl_smcuda_hdr_t);
10641054
seg.seg_len = hdr->len;
1065-
Frag.base.des_segment_count = 1;
1066-
Frag.base.des_segments = &seg;
1067-
#if OPAL_CUDA_SUPPORT
1068-
Frag.hdr = hdr; /* needed for peer rank in control messages */
1069-
#endif /* OPAL_CUDA_SUPPORT */
1070-
reg->cbfunc(&mca_btl_smcuda.super, hdr->tag, &(Frag.base),
1071-
reg->cbdata);
1055+
1056+
mca_btl_active_message_callback_t *reg = mca_btl_base_active_message_trigger + hdr->tag;
1057+
mca_btl_base_receive_descriptor_t recv_desc = {.endpoint = mca_btl_smcuda_component.sm_peers[peer_smp_rank],
1058+
.des_segments = &seg,
1059+
.des_segment_count = 1,
1060+
.tag = hdr->tag,
1061+
.cbdata = reg->cbdata};
1062+
reg->cbfunc(&mca_btl_smcuda.super, &recv_desc);
10721063
/* return the fragment */
10731064
MCA_BTL_SMCUDA_FIFO_WRITE(
10741065
mca_btl_smcuda_component.sm_peers[peer_smp_rank],

0 commit comments

Comments
 (0)