/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */ /* * Copyright (c) 2004-2005 The Trustees of Indiana University and Indiana * University Research and Technology * Corporation. All rights reserved. * Copyright (c) 2004-2005 The University of Tennessee and The University * of Tennessee Research Foundation. All rights * reserved. * Copyright (c) 2004-2005 High Performance Computing Center Stuttgart, * University of Stuttgart. All rights reserved. * Copyright (c) 2004-2005 The Regents of the University of California. * All rights reserved. * Copyright (c) 2009 IBM Corporation. All rights reserved. * Copyright (c) 2012-2015 Los Alamos National Security, LLC. All rights * reserved. * Copyright (c) 2018 Research Organization for Information Science * and Technology (RIST). All rights reserved. * $COPYRIGHT$ * * Additional copyrights may follow * * $HEADER$ */ /** * @file */ #ifndef MCA_PML_OB1_HEADER_H #define MCA_PML_OB1_HEADER_H #include "ompi_config.h" #ifdef HAVE_SYS_TYPES_H #include #endif #ifdef HAVE_NETINET_IN_H #include #endif #include "opal/types.h" #include "opal/util/arch.h" #include "opal/mca/btl/btl.h" #include "ompi/proc/proc.h" #define MCA_PML_OB1_HDR_TYPE_MATCH (MCA_BTL_TAG_PML + 1) #define MCA_PML_OB1_HDR_TYPE_RNDV (MCA_BTL_TAG_PML + 2) #define MCA_PML_OB1_HDR_TYPE_RGET (MCA_BTL_TAG_PML + 3) #define MCA_PML_OB1_HDR_TYPE_ACK (MCA_BTL_TAG_PML + 4) #define MCA_PML_OB1_HDR_TYPE_NACK (MCA_BTL_TAG_PML + 5) #define MCA_PML_OB1_HDR_TYPE_FRAG (MCA_BTL_TAG_PML + 6) #define MCA_PML_OB1_HDR_TYPE_GET (MCA_BTL_TAG_PML + 7) #define MCA_PML_OB1_HDR_TYPE_PUT (MCA_BTL_TAG_PML + 8) #define MCA_PML_OB1_HDR_TYPE_FIN (MCA_BTL_TAG_PML + 9) #define MCA_PML_OB1_HDR_TYPE_CID (MCA_BTL_TAG_PML + 10) #define MCA_PML_OB1_HDR_FLAGS_ACK 0x01 /* is an ack required */ #define MCA_PML_OB1_HDR_FLAGS_NBO 0x02 /* is the hdr in network byte order */ #define MCA_PML_OB1_HDR_FLAGS_PIN 0x04 /* is user buffer pinned */ #define MCA_PML_OB1_HDR_FLAGS_CONTIG 0x08 /* is user buffer contiguous */ #define MCA_PML_OB1_HDR_FLAGS_NORDMA 0x10 /* rest will be send by copy-in-out */ #define MCA_PML_OB1_HDR_FLAGS_SIGNAL 0x20 /* message can be optionally signalling */ /** * Common hdr attributes - must be first element in each hdr type */ struct mca_pml_ob1_common_hdr_t { uint8_t hdr_type; /**< type of envelope */ uint8_t hdr_flags; /**< flags indicating how fragment should be processed */ }; typedef struct mca_pml_ob1_common_hdr_t mca_pml_ob1_common_hdr_t; static inline void mca_pml_ob1_common_hdr_prepare (mca_pml_ob1_common_hdr_t *hdr, uint8_t hdr_type, uint8_t hdr_flags) { hdr->hdr_type = hdr_type; hdr->hdr_flags = hdr_flags; } #define MCA_PML_OB1_COMMON_HDR_NTOH(h) #define MCA_PML_OB1_COMMON_HDR_HTON(h) /** * Header definition for sending a CID/local comm index combo */ struct mca_pml_ob1_cid_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; ompi_comm_extended_cid_t hdr_cid; int16_t hdr_src_comm_index; int32_t hdr_src; }; typedef struct mca_pml_ob1_cid_hdr_t mca_pml_ob1_cid_hdr_t; static inline void mca_pml_ob1_cid_hdr_prepare (mca_pml_ob1_cid_hdr_t *hdr, ompi_communicator_t *comm) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_CID, 0); hdr->hdr_cid = ompi_comm_get_extended_cid (comm); hdr->hdr_src_comm_index = comm->c_index; hdr->hdr_src = ompi_comm_rank (comm); } /** * Header definition for the first fragment, contains the * attributes required to match the corresponding posted receive. */ struct mca_pml_ob1_match_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */ uint16_t hdr_ctx; /**< communicator index */ int32_t hdr_src; /**< source rank */ int32_t hdr_tag; /**< user tag */ uint16_t hdr_seq; /**< message sequence number */ #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[2]; /**< explicitly pad to 16 bytes. Compilers seem to already prefer to do this, but make it explicit just in case */ #endif }; #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG #define OMPI_PML_OB1_MATCH_HDR_LEN 16 #else #define OMPI_PML_OB1_MATCH_HDR_LEN 14 #endif typedef struct mca_pml_ob1_match_hdr_t mca_pml_ob1_match_hdr_t; static inline void mca_pml_ob1_match_hdr_prepare (mca_pml_ob1_match_hdr_t *hdr, uint8_t hdr_type, uint8_t hdr_flags, uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, hdr_type, hdr_flags); hdr->hdr_ctx = hdr_ctx; hdr->hdr_src = hdr_src; hdr->hdr_tag = hdr_tag; hdr->hdr_seq = hdr_seq; #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; #endif } #define MCA_PML_OB1_MATCH_HDR_NTOH(h) \ do { \ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_ctx = ntohs((h).hdr_ctx); \ (h).hdr_src = ntohl((h).hdr_src); \ (h).hdr_tag = ntohl((h).hdr_tag); \ (h).hdr_seq = ntohs((h).hdr_seq); \ } while (0) #define MCA_PML_OB1_MATCH_HDR_HTON(h) \ do { \ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_ctx = htons((h).hdr_ctx); \ (h).hdr_src = htonl((h).hdr_src); \ (h).hdr_tag = htonl((h).hdr_tag); \ (h).hdr_seq = htons((h).hdr_seq); \ } while (0) #define MCA_PML_OB1_EXT_MATCH_HDR_NTOH(h) \ do {\ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_cid.cid_base = ntoh64((h).hdr_cid.cid_base); \ (h).hdr_cid.cid_sub.u64 = ntoh64((h).hdr_cid.cid_sub.u64); \ (h).hdr_src_comm_index = ntohs((h).hdr_src_comm_index); \ (h).hdr_src = ntohl((h).hdr_src); \ } while (0) #define MCA_PML_OB1_EXT_MATCH_HDR_HTON(h) \ do {\ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_cid.cid_base = hton64((h).hdr_cid.cid_base); \ (h).hdr_cid.cid_sub.u64 = hton64((h).hdr_cid.cid_sub.u64); \ (h).hdr_src_comm_index = htons((h).hdr_src_comm_index); \ (h).hdr_src = htonl((h).hdr_src); \ } while (0) struct mca_pml_ob1_ext_match_hdr_t { mca_pml_ob1_cid_hdr_t hdr_ext_cid; /* actual match */ mca_pml_ob1_match_hdr_t hdr_match; }; typedef struct mca_pml_ob1_ext_match_hdr_t mca_pml_ob1_ext_match_hdr_t; /* * * Header definition for the first fragment when an acknowledgment * is required. This could be the first fragment of a large message * or a short message that requires an ack (synchronous). */ struct mca_pml_ob1_rendezvous_hdr_t { mca_pml_ob1_match_hdr_t hdr_match; uint64_t hdr_msg_length; /**< message length */ opal_ptr_t hdr_src_req; /**< pointer to source request - returned in ack */ }; typedef struct mca_pml_ob1_rendezvous_hdr_t mca_pml_ob1_rendezvous_hdr_t; struct mca_pml_ob1_ext_rendezvous_hdr_t { mca_pml_ob1_cid_hdr_t hdr_ext_cid; /* actual match */ mca_pml_ob1_rendezvous_hdr_t hdr_rndv; }; typedef struct mca_pml_ob1_ext_rendezvous_hdr_t mca_pml_ob1_ext_rendezvous_hdr_t; static inline void mca_pml_ob1_rendezvous_hdr_prepare (mca_pml_ob1_rendezvous_hdr_t *hdr, uint8_t hdr_type, uint8_t hdr_flags, uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq, uint64_t hdr_msg_length, void *hdr_src_req) { mca_pml_ob1_match_hdr_prepare (&hdr->hdr_match, hdr_type, hdr_flags, hdr_ctx, hdr_src, hdr_tag, hdr_seq); hdr->hdr_msg_length = hdr_msg_length; hdr->hdr_src_req.pval = hdr_src_req; } /* Note that hdr_src_req is not put in network byte order because it is never processed by the receiver, other than being copied into the ack header */ #define MCA_PML_OB1_RNDV_HDR_NTOH(h) \ do { \ MCA_PML_OB1_MATCH_HDR_NTOH((h).hdr_match); \ (h).hdr_msg_length = ntoh64((h).hdr_msg_length); \ } while (0) #define MCA_PML_OB1_RNDV_HDR_HTON(h) \ do { \ MCA_PML_OB1_MATCH_HDR_HTON((h).hdr_match); \ (h).hdr_msg_length = hton64((h).hdr_msg_length); \ } while (0) /** * Header definition for a combined rdma rendezvous/get */ struct mca_pml_ob1_rget_hdr_t { mca_pml_ob1_rendezvous_hdr_t hdr_rndv; #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[4]; #endif opal_ptr_t hdr_frag; /**< source fragment (for fin) */ uint64_t hdr_src_ptr; /**< source pointer */ /* btl registration handle data follows */ }; typedef struct mca_pml_ob1_rget_hdr_t mca_pml_ob1_rget_hdr_t; struct mca_pml_ob1_ext_rget_hdr_t { mca_pml_ob1_cid_hdr_t hdr_ext_cid; /* actual match */ mca_pml_ob1_rget_hdr_t hdr_rget; }; typedef struct mca_pml_ob1_ext_rget_hdr_t mca_pml_ob1_ext_rget_hdr_t; static inline void mca_pml_ob1_rget_hdr_prepare (mca_pml_ob1_rget_hdr_t *hdr, uint8_t hdr_flags, uint16_t hdr_ctx, int32_t hdr_src, int32_t hdr_tag, uint16_t hdr_seq, uint64_t hdr_msg_length, void *hdr_src_req, void *hdr_frag, void *hdr_src_ptr, void *local_handle, size_t local_handle_size) { mca_pml_ob1_rendezvous_hdr_prepare (&hdr->hdr_rndv, MCA_PML_OB1_HDR_TYPE_RGET, hdr_flags, hdr_ctx, hdr_src, hdr_tag, hdr_seq, hdr_msg_length, hdr_src_req); #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; hdr->hdr_padding[2] = 0; hdr->hdr_padding[3] = 0; #endif hdr->hdr_frag.pval = hdr_frag; hdr->hdr_src_ptr = (uint64_t)(intptr_t) hdr_src_ptr; /* copy registration handle */ memcpy (hdr + 1, local_handle, local_handle_size); } #define MCA_PML_OB1_RGET_HDR_NTOH(h) \ do { \ MCA_PML_OB1_RNDV_HDR_NTOH((h).hdr_rndv); \ (h).hdr_src_ptr = ntoh64((h).hdr_src_ptr); \ } while (0) #define MCA_PML_OB1_RGET_HDR_HTON(h) \ do { \ MCA_PML_OB1_RNDV_HDR_HTON((h).hdr_rndv); \ (h).hdr_src_ptr = hton64((h).hdr_src_ptr); \ } while (0) /** * Header for subsequent fragments. */ struct mca_pml_ob1_frag_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */ #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[6]; #endif uint64_t hdr_frag_offset; /**< offset into message */ opal_ptr_t hdr_src_req; /**< pointer to source request */ opal_ptr_t hdr_dst_req; /**< pointer to matched receive */ }; typedef struct mca_pml_ob1_frag_hdr_t mca_pml_ob1_frag_hdr_t; static inline void mca_pml_ob1_frag_hdr_prepare (mca_pml_ob1_frag_hdr_t *hdr, uint8_t hdr_flags, uint64_t hdr_frag_offset, void *hdr_src_req, uint64_t hdr_dst_req) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_FRAG, hdr_flags); #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; hdr->hdr_padding[2] = 0; hdr->hdr_padding[3] = 0; hdr->hdr_padding[4] = 0; hdr->hdr_padding[5] = 0; #endif hdr->hdr_frag_offset = hdr_frag_offset; hdr->hdr_src_req.pval = hdr_src_req; hdr->hdr_dst_req.lval = hdr_dst_req; } #define MCA_PML_OB1_FRAG_HDR_NTOH(h) \ do { \ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_frag_offset = ntoh64((h).hdr_frag_offset); \ } while (0) #define MCA_PML_OB1_FRAG_HDR_HTON(h) \ do { \ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_frag_offset = hton64((h).hdr_frag_offset); \ } while (0) /** * Header used to acknowledgment outstanding fragment(s). */ struct mca_pml_ob1_ack_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */ #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[6]; #endif opal_ptr_t hdr_src_req; /**< source request */ opal_ptr_t hdr_dst_req; /**< matched receive request */ uint64_t hdr_send_offset; /**< starting point of copy in/out */ uint64_t hdr_send_size; /**< number of bytes requested (0: all remaining) */ }; typedef struct mca_pml_ob1_ack_hdr_t mca_pml_ob1_ack_hdr_t; static inline void mca_pml_ob1_ack_hdr_prepare (mca_pml_ob1_ack_hdr_t *hdr, uint8_t hdr_flags, uint64_t hdr_src_req, void *hdr_dst_req, uint64_t hdr_send_offset, uint64_t hdr_send_size) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_ACK, hdr_flags); #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; hdr->hdr_padding[2] = 0; hdr->hdr_padding[3] = 0; hdr->hdr_padding[4] = 0; hdr->hdr_padding[5] = 0; #endif hdr->hdr_src_req.lval = hdr_src_req; hdr->hdr_dst_req.pval = hdr_dst_req; hdr->hdr_send_offset = hdr_send_offset; hdr->hdr_send_size = hdr_send_size; } /* Note that the request headers are not put in NBO because the src_req is already in receiver's byte order and the dst_req is not used by the receiver for anything other than backpointers in return headers */ #define MCA_PML_OB1_ACK_HDR_NTOH(h) \ do { \ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_send_offset = ntoh64((h).hdr_send_offset); \ (h).hdr_send_size = ntoh64((h).hdr_send_size); \ } while (0) #define MCA_PML_OB1_ACK_HDR_HTON(h) \ do { \ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_send_offset = hton64((h).hdr_send_offset); \ (h).hdr_send_size = hton64((h).hdr_send_size); \ } while (0) /** * Header used to initiate an RDMA operation. */ struct mca_pml_ob1_rdma_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */ #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[6]; /** two to pad out the hdr to a 4 byte alignment. hdr_req will then be 8 byte aligned after 4 for hdr_seg_cnt */ #endif /* TODO: add real support for multiple destination segments */ opal_ptr_t hdr_req; /**< destination request */ opal_ptr_t hdr_frag; /**< receiver fragment */ opal_ptr_t hdr_recv_req; /**< receive request (NTH: needed for put fallback on send) */ uint64_t hdr_rdma_offset; /**< current offset into user buffer */ uint64_t hdr_dst_ptr; /**< destination address */ uint64_t hdr_dst_size; /**< destination size */ /* registration data follows */ }; typedef struct mca_pml_ob1_rdma_hdr_t mca_pml_ob1_rdma_hdr_t; static inline void mca_pml_ob1_rdma_hdr_prepare (mca_pml_ob1_rdma_hdr_t *hdr, uint8_t hdr_flags, uint64_t hdr_req, void *hdr_frag, void *hdr_recv_req, uint64_t hdr_rdma_offset, void *hdr_dst_ptr, uint64_t hdr_dst_size, void *local_handle, size_t local_handle_size) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_PUT, hdr_flags); #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; hdr->hdr_padding[2] = 0; hdr->hdr_padding[3] = 0; hdr->hdr_padding[4] = 0; hdr->hdr_padding[5] = 0; #endif hdr->hdr_req.lval = hdr_req; hdr->hdr_frag.pval = hdr_frag; hdr->hdr_recv_req.pval = hdr_recv_req; hdr->hdr_rdma_offset = hdr_rdma_offset; hdr->hdr_dst_ptr = (uint64_t)(intptr_t) hdr_dst_ptr; hdr->hdr_dst_size = hdr_dst_size; /* copy segments */ memcpy (hdr + 1, local_handle, local_handle_size); } #define MCA_PML_OB1_RDMA_HDR_NTOH(h) \ do { \ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_rdma_offset = ntoh64((h).hdr_rdma_offset); \ (h).hdr_dst_ptr = ntoh64((h).hdr_dst_ptr); \ (h).hdr_dst_size = ntoh64((h).hdr_dst_size); \ } while (0) #define MCA_PML_OB1_RDMA_HDR_HTON(h) \ do { \ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_rdma_offset = hton64((h).hdr_rdma_offset); \ (h).hdr_dst_ptr = hton64((h).hdr_dst_ptr); \ (h).hdr_dst_size = hton64((h).hdr_dst_size); \ } while (0) /** * Header used to complete an RDMA operation. */ struct mca_pml_ob1_fin_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; /**< common attributes */ #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT || OPAL_ENABLE_DEBUG uint8_t hdr_padding[6]; #endif int64_t hdr_size; /**< number of bytes completed (positive), error code (negative) */ opal_ptr_t hdr_frag; /**< completed RDMA fragment */ }; typedef struct mca_pml_ob1_fin_hdr_t mca_pml_ob1_fin_hdr_t; static inline void mca_pml_ob1_fin_hdr_prepare (mca_pml_ob1_fin_hdr_t *hdr, uint8_t hdr_flags, uint64_t hdr_frag, int64_t hdr_size) { mca_pml_ob1_common_hdr_prepare (&hdr->hdr_common, MCA_PML_OB1_HDR_TYPE_FIN, hdr_flags); #if OPAL_ENABLE_DEBUG hdr->hdr_padding[0] = 0; hdr->hdr_padding[1] = 0; hdr->hdr_padding[2] = 0; hdr->hdr_padding[3] = 0; hdr->hdr_padding[4] = 0; hdr->hdr_padding[5] = 0; #endif hdr->hdr_frag.lval = hdr_frag; hdr->hdr_size = hdr_size; } #define MCA_PML_OB1_FIN_HDR_NTOH(h) \ do { \ MCA_PML_OB1_COMMON_HDR_NTOH((h).hdr_common); \ (h).hdr_size = ntoh64((h).hdr_size); \ } while (0) #define MCA_PML_OB1_FIN_HDR_HTON(h) \ do { \ MCA_PML_OB1_COMMON_HDR_HTON((h).hdr_common); \ (h).hdr_size = hton64((h).hdr_size); \ } while (0) /** * Union of defined hdr types. */ union mca_pml_ob1_hdr_t { mca_pml_ob1_common_hdr_t hdr_common; mca_pml_ob1_match_hdr_t hdr_match; mca_pml_ob1_rendezvous_hdr_t hdr_rndv; mca_pml_ob1_rget_hdr_t hdr_rget; mca_pml_ob1_frag_hdr_t hdr_frag; mca_pml_ob1_ack_hdr_t hdr_ack; mca_pml_ob1_rdma_hdr_t hdr_rdma; mca_pml_ob1_fin_hdr_t hdr_fin; /* extended CID support */ mca_pml_ob1_cid_hdr_t hdr_cid; mca_pml_ob1_ext_match_hdr_t hdr_ext_match; mca_pml_ob1_ext_rendezvous_hdr_t hdr_ext_rndv; mca_pml_ob1_ext_rget_hdr_t hdr_ext_rget; }; typedef union mca_pml_ob1_hdr_t mca_pml_ob1_hdr_t; #if !defined(WORDS_BIGENDIAN) && OPAL_ENABLE_HETEROGENEOUS_SUPPORT static inline void ob1_hdr_ntoh(mca_pml_ob1_hdr_t *hdr, const uint8_t hdr_type) { if(!(hdr->hdr_common.hdr_flags & MCA_PML_OB1_HDR_FLAGS_NBO)) return; switch(hdr_type) { case MCA_PML_OB1_HDR_TYPE_MATCH: MCA_PML_OB1_MATCH_HDR_NTOH(hdr->hdr_match); break; case MCA_PML_OB1_HDR_TYPE_RNDV: MCA_PML_OB1_RNDV_HDR_NTOH(hdr->hdr_rndv); break; case MCA_PML_OB1_HDR_TYPE_RGET: MCA_PML_OB1_RGET_HDR_NTOH(hdr->hdr_rget); break; case MCA_PML_OB1_HDR_TYPE_ACK: MCA_PML_OB1_ACK_HDR_NTOH(hdr->hdr_ack); break; case MCA_PML_OB1_HDR_TYPE_FRAG: MCA_PML_OB1_FRAG_HDR_NTOH(hdr->hdr_frag); break; case MCA_PML_OB1_HDR_TYPE_PUT: MCA_PML_OB1_RDMA_HDR_NTOH(hdr->hdr_rdma); break; case MCA_PML_OB1_HDR_TYPE_FIN: MCA_PML_OB1_FIN_HDR_NTOH(hdr->hdr_fin); break; case MCA_PML_OB1_HDR_TYPE_CID: { mca_pml_ob1_hdr_t *next_hdr = (mca_pml_ob1_hdr_t *) ((uintptr_t) hdr + sizeof (hdr->hdr_cid)); MCA_PML_OB1_EXT_MATCH_HDR_NTOH(hdr->hdr_cid); /* now swap the real header */ ob1_hdr_ntoh (next_hdr, next_hdr->hdr_common.hdr_type); break; } default: assert(0); break; } } #else #define ob1_hdr_ntoh(h, t) do{}while(0) #endif #if OPAL_ENABLE_HETEROGENEOUS_SUPPORT #define ob1_hdr_hton(h, t, p) \ ob1_hdr_hton_intr((mca_pml_ob1_hdr_t*)h, t, p) static inline void ob1_hdr_hton_intr(mca_pml_ob1_hdr_t *hdr, const uint8_t hdr_type, const ompi_proc_t *proc) { #ifdef WORDS_BIGENDIAN hdr->hdr_common.hdr_flags |= MCA_PML_OB1_HDR_FLAGS_NBO; #else if(!(proc->super.proc_arch & OPAL_ARCH_ISBIGENDIAN)) return; hdr->hdr_common.hdr_flags |= MCA_PML_OB1_HDR_FLAGS_NBO; switch(hdr_type) { case MCA_PML_OB1_HDR_TYPE_MATCH: MCA_PML_OB1_MATCH_HDR_HTON(hdr->hdr_match); break; case MCA_PML_OB1_HDR_TYPE_RNDV: MCA_PML_OB1_RNDV_HDR_HTON(hdr->hdr_rndv); break; case MCA_PML_OB1_HDR_TYPE_RGET: MCA_PML_OB1_RGET_HDR_HTON(hdr->hdr_rget); break; case MCA_PML_OB1_HDR_TYPE_ACK: MCA_PML_OB1_ACK_HDR_HTON(hdr->hdr_ack); break; case MCA_PML_OB1_HDR_TYPE_FRAG: MCA_PML_OB1_FRAG_HDR_HTON(hdr->hdr_frag); break; case MCA_PML_OB1_HDR_TYPE_PUT: MCA_PML_OB1_RDMA_HDR_HTON(hdr->hdr_rdma); break; case MCA_PML_OB1_HDR_TYPE_FIN: MCA_PML_OB1_FIN_HDR_HTON(hdr->hdr_fin); break; case MCA_PML_OB1_HDR_TYPE_CID: { mca_pml_ob1_hdr_t *next_hdr = (mca_pml_ob1_hdr_t *) ((uintptr_t) hdr + sizeof (hdr->hdr_cid)); MCA_PML_OB1_EXT_MATCH_HDR_HTON(hdr->hdr_cid); /* now swap the real header */ ob1_hdr_hton (next_hdr, next_hdr->hdr_common.hdr_type, proc); break; } default: assert(0); break; } #endif } #else #define ob1_hdr_hton(h, t, p) do{}while(0) #endif static inline __opal_attribute_always_inline__ void ob1_hdr_copy(mca_pml_ob1_hdr_t *src, mca_pml_ob1_hdr_t *dst) { do { switch(src->hdr_common.hdr_type) { case MCA_PML_OB1_HDR_TYPE_MATCH: memcpy( &(dst->hdr_match), &(src->hdr_match), sizeof(mca_pml_ob1_match_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_RNDV: memcpy( &(dst->hdr_rndv), &(src->hdr_rndv), sizeof(mca_pml_ob1_rendezvous_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_RGET: memcpy( &(dst->hdr_rget), &(src->hdr_rget), sizeof(mca_pml_ob1_rget_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_ACK: memcpy( &(dst->hdr_ack), &(src->hdr_ack), sizeof(mca_pml_ob1_ack_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_FRAG: memcpy( &(dst->hdr_frag), &(src->hdr_frag), sizeof(mca_pml_ob1_frag_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_PUT: memcpy( &(dst->hdr_rdma), &(src->hdr_rdma), sizeof(mca_pml_ob1_rdma_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_FIN: memcpy( &(dst->hdr_fin), &(src->hdr_fin), sizeof(mca_pml_ob1_fin_hdr_t) ); break; case MCA_PML_OB1_HDR_TYPE_CID: { mca_pml_ob1_hdr_t *next_src = (mca_pml_ob1_hdr_t *) ((uintptr_t) src + sizeof (src->hdr_cid)); mca_pml_ob1_hdr_t *next_dst = (mca_pml_ob1_hdr_t *) ((uintptr_t) dst + sizeof (dst->hdr_cid)); memcpy (&dst->hdr_cid, &src->hdr_cid, sizeof (src->hdr_cid)); /* can't call recursively and expect inlining */ src = next_src; dst = next_dst; continue; } default: memcpy( &(dst->hdr_common), &(src->hdr_common), sizeof(mca_pml_ob1_common_hdr_t) ); break; } break; } while (1); } #endif /* MCA_PML_OB1_HEADER_H */