-
Notifications
You must be signed in to change notification settings - Fork 875
/
Copy pathopal_datatype.h
358 lines (316 loc) · 15.4 KB
/
opal_datatype.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil -*- */
/*
* Copyright (c) 2004-2006 The Trustees of Indiana University and Indiana
* University Research and Technology
* Corporation. All rights reserved.
* Copyright (c) 2004-2017 The University of Tennessee and The University
* of Tennessee Research Foundation. All rights
* reserved.
* Copyright (c) 2004-2006 High Performance Computing Center Stuttgart,
* University of Stuttgart. All rights reserved.
* Copyright (c) 2004-2006 The Regents of the University of California.
* All rights reserved.
* Copyright (c) 2007-2013 Los Alamos National Security, LLC. All rights
* reserved.
* Copyright (c) 2009 Sun Microsystems, Inc. All rights reserved.
* Copyright (c) 2009 Oak Ridge National Labs. All rights reserved.
* Copyright (c) 2017-2018 Research Organization for Information Science
* and Technology (RIST). All rights reserved.
* Copyright (c) 2018 Triad National Security, LLC. All rights
* reserved.
* Copyright (c) 2018 FUJITSU LIMITED. All rights reserved.
* $COPYRIGHT$
*
* Additional copyrights may follow
*
* $HEADER$
*/
/**
* opal_datatype_t interface for OPAL internal data type representation
*
* opal_datatype_t is a class which represents contiguous or
* non-contiguous data together with constituent type-related
* information.
*/
#ifndef OPAL_DATATYPE_H_HAS_BEEN_INCLUDED
#define OPAL_DATATYPE_H_HAS_BEEN_INCLUDED
#include "opal_config.h"
#include <stddef.h>
#include "opal/class/opal_object.h"
BEGIN_C_DECLS
/*
 * Number of predefined (basic) datatypes known to the OPAL layer.
 *
 * The bdt_used field of struct opal_datatype_t is a bitset recording which
 * basic datatypes are used, so this value must not exceed the number of
 * bits (not bytes) of that field (currently uint32_t). If more basic
 * datatypes are ever needed, the field must be widened accordingly.
 *
 * This must match the same definition as in opal_datatype_internal.h
 */
#if !defined(OPAL_DATATYPE_MAX_PREDEFINED)
# define OPAL_DATATYPE_MAX_PREDEFINED 28
#endif
/*
 * Upper limit of the number of _Basic_ datatypes supported (in order to
 * not change setup and usage of the predefined datatypes).
 *
 * BEWARE: This constant should reflect whatever the OMPI-layer needs.
 */
#define OPAL_DATATYPE_MAX_SUPPORTED 64
/*
 * Flags for the datatypes. The inline predicates in this header test them
 * against the `flags` member of struct opal_datatype_t.
 */
#define OPAL_DATATYPE_FLAG_UNAVAILABLE \
0x0001 /**< datatypes unavailable on the build (OS or compiler dependent) */
#define OPAL_DATATYPE_FLAG_PREDEFINED \
0x0002 /**< cannot be removed: initial and predefined datatypes */
#define OPAL_DATATYPE_FLAG_COMMITTED 0x0004 /**< ready to be used for a send/recv operation */
#define OPAL_DATATYPE_FLAG_OVERLAP 0x0008 /**< datatype is not suitable for a recv operation */
#define OPAL_DATATYPE_FLAG_CONTIGUOUS 0x0010 /**< contiguous datatype */
#define OPAL_DATATYPE_FLAG_NO_GAPS \
0x0020 /**< no gaps around the datatype, aka OPAL_DATATYPE_FLAG_CONTIGUOUS and extent == size \
*/
#define OPAL_DATATYPE_FLAG_USER_LB 0x0040 /**< has a user defined LB */
#define OPAL_DATATYPE_FLAG_USER_UB 0x0080 /**< has a user defined UB */
#define OPAL_DATATYPE_FLAG_DATA 0x0100 /**< data or control structure */
/*
 * We should distinguish here between the predefined contiguous and the
 * predefined non-contiguous datatypes. OPAL_DATATYPE_FLAG_BASIC is the flag
 * combination held by all predefined contiguous datatypes.
 */
#define OPAL_DATATYPE_FLAG_BASIC \
(OPAL_DATATYPE_FLAG_PREDEFINED | OPAL_DATATYPE_FLAG_CONTIGUOUS | OPAL_DATATYPE_FLAG_NO_GAPS \
| OPAL_DATATYPE_FLAG_DATA | OPAL_DATATYPE_FLAG_COMMITTED)
/*
 * If during the datatype optimization process we collapse contiguous elements with
 * different types, we cannot use this optimized description for any communication
 * in a heterogeneous setting, especially not for the external32 support.
 *
 * A datatype with this flag cannot use the optimized description in heterogeneous
 * setups.
 */
#define OPAL_DATATYPE_OPTIMIZED_RESTRICTED 0x1000
/**
 * The number of supported entries in the data-type definition and the
 * associated type.
 *
 * NOTE(review): UINT_MAX is defined by <limits.h>, which this header does not
 * include directly — presumably it arrives through opal_config.h; confirm.
 * NOTE(review): the limit is UINT_MAX while the count type below is size_t;
 * confirm that the mismatch is intentional.
 */
#define MAX_DT_COMPONENT_COUNT UINT_MAX
typedef size_t opal_datatype_count_t;
/* Element descriptor; only forward-declared here, its layout is not visible in this header. */
typedef union dt_elem_desc dt_elem_desc_t;
/**
 * A description array together with its capacity and its fill level.
 */
struct dt_type_desc_t {
opal_datatype_count_t length; /**< the maximum number of elements in the description array */
opal_datatype_count_t used; /**< the number of used elements in the description array */
dt_elem_desc_t *desc; /**< the description array itself */
};
typedef struct dt_type_desc_t dt_type_desc_t;
/*
 * The datatype description.
 *
 * NOTE(review): the cacheline/size annotations inside the struct look like
 * stale layout-tool output — they report 15 members while 16 are declared
 * below. Re-measure before relying on them.
 */
struct opal_datatype_t {
opal_object_t super; /**< basic superclass */
uint16_t flags; /**< the flags (tested against the OPAL_DATATYPE_FLAG_* bits) */
uint16_t id; /**< data id, normally the index in the data array. */
uint32_t bdt_used; /**< bitset of which basic datatypes are used in the data description */
size_t size; /**< total size in bytes of the memory used by the data if
the data is put on a contiguous buffer */
ptrdiff_t true_lb; /**< the true lb of the data without user defined lb and ub */
ptrdiff_t true_ub; /**< the true ub of the data without user defined lb and ub */
ptrdiff_t lb; /**< lower bound in memory */
ptrdiff_t ub; /**< upper bound in memory; the extent is computed as ub - lb */
/* --- cacheline 1 boundary (64 bytes) --- */
size_t nbElems; /**< total number of elements inside the datatype */
uint32_t align; /**< data should be aligned to */
uint32_t loops; /**< number of loops on the internal type stack */
/* Attribute fields */
char name[OPAL_MAX_OBJECT_NAME]; /**< name of the datatype */
dt_type_desc_t desc; /**< the data description */
dt_type_desc_t opt_desc; /**< short description of the data used when conversion is useless
or in the send case (without conversion) */
size_t *ptypes; /**< array of basic predefined types that facilitate the computing
of the remote size in heterogeneous environments. The length of the
array is dependent on the maximum number of predefined datatypes of
all language interfaces (because Fortran is not known at the OPAL
layer). This field should never be initialized in homogeneous
environments */
/* --- cacheline 5 boundary (320 bytes) was 32-36 bytes ago --- */
/* size: 352, cachelines: 6, members: 15 */
/* last cacheline: 28-32 bytes */
};
typedef struct opal_datatype_t opal_datatype_t;
/* Class declaration for opal_datatype_t (OBJ_CLASS_DECLARATION is not defined in this header). */
OPAL_DECLSPEC OBJ_CLASS_DECLARATION(opal_datatype_t);
/*
 * Per-predefined-datatype tables, each with OPAL_DATATYPE_MAX_PREDEFINED
 * entries.
 * NOTE(review): presumably indexed by the `id` member of opal_datatype_t —
 * confirm against the definitions.
 */
OPAL_DECLSPEC extern const opal_datatype_t
*opal_datatype_basicDatatypes[OPAL_DATATYPE_MAX_PREDEFINED];
OPAL_DECLSPEC extern const size_t opal_datatype_local_sizes[OPAL_DATATYPE_MAX_PREDEFINED];
/* Local Architecture as provided by opal_arch_compute_local_id() */
OPAL_DECLSPEC extern uint32_t opal_local_arch;
/*
 * The OPAL-layer's Basic datatypes themselves.
 *
 * All of them are declared const here and are defined elsewhere. For the
 * intN/uintN/floatN families the numeric suffix is the size in bytes.
 */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_empty;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_loop;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_end_loop;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_lb;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_ub;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_int1; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_int2; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_int4; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_int8; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_int16; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_uint1; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_uint2; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_uint4; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_uint8; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_uint16; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float2; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float4; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float8; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float12; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float16; /* in bytes */
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_short_float_complex;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_float_complex;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_double_complex;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_long_double_complex;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_bool;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_wchar;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_long;
OPAL_DECLSPEC extern const opal_datatype_t opal_datatype_unsigned_long;
/*
 * Functions exported externally.
 *
 * Only the prototypes are visible in this header; the notes below are limited
 * to what the signatures themselves show.
 *
 * NOTE(review): opal_datatype_register_params() is the only prototype in this
 * group declared without OPAL_DECLSPEC — confirm that this is intentional.
 */
int opal_datatype_register_params(void);
OPAL_DECLSPEC int32_t opal_datatype_init(void);
/* Returns a datatype object; expectedSize presumably sizes its description array — TODO confirm. */
OPAL_DECLSPEC opal_datatype_t *opal_datatype_create(int32_t expectedSize);
/* Same as above, but operates on a datatype object supplied by the caller. */
OPAL_DECLSPEC int32_t opal_datatype_create_desc(opal_datatype_t *datatype, int32_t expectedSize);
OPAL_DECLSPEC int32_t opal_datatype_commit(opal_datatype_t *pData);
/* Takes the address of the caller's pointer, so the callee is able to modify that pointer. */
OPAL_DECLSPEC int32_t opal_datatype_destroy(opal_datatype_t **);
OPAL_DECLSPEC int32_t opal_datatype_is_monotonic(opal_datatype_t *type);
/**
 * Tell whether OPAL_DATATYPE_FLAG_COMMITTED is set on a datatype.
 *
 * @param type  datatype to inspect; dereferenced unconditionally
 * @return 1 when the flag is set, 0 otherwise
 */
static inline int32_t opal_datatype_is_committed(const opal_datatype_t *type)
{
    const int32_t committed_bits = type->flags & OPAL_DATATYPE_FLAG_COMMITTED;

    return (OPAL_DATATYPE_FLAG_COMMITTED == committed_bits) ? 1 : 0;
}
/**
 * Tell whether OPAL_DATATYPE_FLAG_OVERLAP is set on a datatype.
 *
 * @param type  datatype to inspect; dereferenced unconditionally
 * @return 1 when the flag is set, 0 otherwise
 */
static inline int32_t opal_datatype_is_overlapped(const opal_datatype_t *type)
{
    const int32_t overlap_bits = type->flags & OPAL_DATATYPE_FLAG_OVERLAP;

    return (OPAL_DATATYPE_FLAG_OVERLAP == overlap_bits) ? 1 : 0;
}
/**
 * Tell whether a datatype is valid, i.e. OPAL_DATATYPE_FLAG_UNAVAILABLE is
 * NOT set on it.
 *
 * @param type  datatype to inspect; dereferenced unconditionally
 * @return 0 when the unavailable flag is set, 1 otherwise
 */
static inline int32_t opal_datatype_is_valid(const opal_datatype_t *type)
{
    const int32_t unavailable_bits = type->flags & OPAL_DATATYPE_FLAG_UNAVAILABLE;

    if (OPAL_DATATYPE_FLAG_UNAVAILABLE == unavailable_bits) {
        return 0;
    }
    return 1;
}
/**
 * Tell whether OPAL_DATATYPE_FLAG_PREDEFINED is set on a datatype.
 *
 * Unlike the sibling predicates, the result is the masked flag value itself
 * and is not normalized to 1, so callers should only test it for zero /
 * non-zero.
 *
 * @param type  datatype to inspect; dereferenced unconditionally
 * @return OPAL_DATATYPE_FLAG_PREDEFINED when the flag is set, 0 otherwise
 */
static inline int32_t opal_datatype_is_predefined(const opal_datatype_t *type)
{
    const int32_t predefined_bits = type->flags & OPAL_DATATYPE_FLAG_PREDEFINED;

    return predefined_bits;
}
/**
 * Tell whether `count` repetitions of a datatype are contiguous in memory.
 *
 * The layout is reported as contiguous when the datatype carries
 * OPAL_DATATYPE_FLAG_CONTIGUOUS and, in addition, either a single element is
 * considered or the datatype also carries OPAL_DATATYPE_FLAG_NO_GAPS.
 *
 * @param datatype  datatype to inspect; dereferenced unconditionally
 * @param count     number of repetitions of the datatype
 * @return 1 (true) for a contiguous layout, 0 (false) otherwise
 */
static inline int32_t opal_datatype_is_contiguous_memory_layout(const opal_datatype_t *datatype,
                                                                int32_t count)
{
    const int32_t contiguous = (0 != (datatype->flags & OPAL_DATATYPE_FLAG_CONTIGUOUS));
    const int32_t gapless = (0 != (datatype->flags & OPAL_DATATYPE_FLAG_NO_GAPS));

    return (contiguous && ((1 == count) || gapless)) ? 1 : 0;
}
/* NOTE(review): presumably emits a human-readable description of pData for
 * debugging; the output destination is not visible here — confirm. */
OPAL_DECLSPEC void opal_datatype_dump(const opal_datatype_t *pData);
/* data creation functions */
/**
 * Create a duplicate of the source datatype.
 *
 * dest_type is passed as a plain pointer, so the destination object is
 * supplied by the caller rather than returned by this function.
 */
OPAL_DECLSPEC int32_t opal_datatype_clone(const opal_datatype_t *src_type,
opal_datatype_t *dest_type);
/**
 * A contiguous array of identical datatypes.
 *
 * The resulting datatype is handed back through newType.
 */
OPAL_DECLSPEC int32_t opal_datatype_create_contiguous(int count, const opal_datatype_t *oldType,
opal_datatype_t **newType);
/**
 * Add a new datatype to the base type description. The count is the number
 * of repetitions of the same element to be added, and the extent is the
 * extent of each element. The displacement is the initial displacement of
 * the first element.
 */
OPAL_DECLSPEC int32_t opal_datatype_add(opal_datatype_t *pdtBase, const opal_datatype_t *pdtAdd,
size_t count, ptrdiff_t disp, ptrdiff_t extent);
/**
 * Alter the lb and extent of an existing datatype in place.
 */
OPAL_DECLSPEC int32_t opal_datatype_resize(opal_datatype_t *type, ptrdiff_t lb, ptrdiff_t extent);
/**
 * Fetch the lower bound (`lb` member) of a datatype.
 *
 * @param pData  datatype to query; dereferenced unconditionally
 * @param disp   [out] receives pData->lb; dereferenced unconditionally
 * @return always 0
 */
static inline int32_t opal_datatype_type_lb(const opal_datatype_t *pData, ptrdiff_t *disp)
{
    const ptrdiff_t lower_bound = pData->lb;

    *disp = lower_bound;
    return 0;
}
/**
 * Fetch the upper bound (`ub` member) of a datatype.
 *
 * @param pData  datatype to query; dereferenced unconditionally
 * @param disp   [out] receives pData->ub; dereferenced unconditionally
 * @return always 0
 */
static inline int32_t opal_datatype_type_ub(const opal_datatype_t *pData, ptrdiff_t *disp)
{
    const ptrdiff_t upper_bound = pData->ub;

    *disp = upper_bound;
    return 0;
}
/**
 * Fetch the size (`size` member) of a datatype.
 *
 * @param pData  datatype to query; dereferenced unconditionally
 * @param size   [out] receives pData->size; dereferenced unconditionally
 * @return always 0
 */
static inline int32_t opal_datatype_type_size(const opal_datatype_t *pData, size_t *size)
{
    const size_t type_size = pData->size;

    *size = type_size;
    return 0;
}
/**
 * Compute the extent of a datatype, i.e. ub - lb.
 *
 * @param pData   datatype to query; dereferenced unconditionally
 * @param extent  [out] receives pData->ub - pData->lb; dereferenced
 *                unconditionally
 * @return always 0
 */
static inline int32_t opal_datatype_type_extent(const opal_datatype_t *pData, ptrdiff_t *extent)
{
    const ptrdiff_t bounds_distance = pData->ub - pData->lb;

    *extent = bounds_distance;
    return 0;
}
/**
 * Fetch both the lower bound and the extent (ub - lb) of a datatype.
 *
 * @param pData   datatype to query; dereferenced unconditionally
 * @param lb      [out] receives pData->lb; written first
 * @param extent  [out] receives pData->ub - pData->lb; written second
 * @return always 0
 */
static inline int32_t opal_datatype_get_extent(const opal_datatype_t *pData, ptrdiff_t *lb,
                                               ptrdiff_t *extent)
{
    /* The lower bound is stored before the extent is evaluated, exactly in
     * that order. */
    *lb = pData->lb;

    const ptrdiff_t bounds_distance = pData->ub - pData->lb;
    *extent = bounds_distance;

    return 0;
}
/**
 * Fetch both the true lower bound and the true extent (true_ub - true_lb)
 * of a datatype.
 *
 * @param pData        datatype to query; dereferenced unconditionally
 * @param true_lb      [out] receives pData->true_lb; written first
 * @param true_extent  [out] receives pData->true_ub - pData->true_lb;
 *                     written second
 * @return always 0
 */
static inline int32_t opal_datatype_get_true_extent(const opal_datatype_t *pData,
                                                    ptrdiff_t *true_lb, ptrdiff_t *true_extent)
{
    /* The true lower bound is stored before the true extent is evaluated,
     * exactly in that order. */
    *true_lb = pData->true_lb;

    const ptrdiff_t true_distance = pData->true_ub - pData->true_lb;
    *true_extent = true_distance;

    return 0;
}
/* NOTE(review): the return type is signed (ssize_t), presumably so that a
 * negative value can report a failure — confirm against the implementation. */
OPAL_DECLSPEC ssize_t opal_datatype_get_element_count(const opal_datatype_t *pData, size_t iSize);
/* The result is handed back through the `length` out-parameter. */
OPAL_DECLSPEC int32_t opal_datatype_set_element_count(const opal_datatype_t *pData, size_t count,
size_t *length);
/* NOTE(review): presumably copies `count` elements laid out as described by
 * pData from pSrcBuf to pDestBuf — confirm. pSrcBuf is not const-qualified. */
OPAL_DECLSPEC int32_t opal_datatype_copy_content_same_ddt(const opal_datatype_t *pData,
int32_t count, char *pDestBuf,
char *pSrcBuf);
/* Takes a non-const datatype; presumably fills in its `ptypes` member — TODO confirm. */
OPAL_DECLSPEC int opal_datatype_compute_ptypes(opal_datatype_t *datatype);
/*
 * Compute the size of the datatype using a specific set of predefined type sizes.
 * This function makes it possible to compute the size of a packed buffer
 * without creating a fully fledged specialized convertor for the remote peer.
 *
 * NOTE(review): `sizes` is presumably laid out like opal_datatype_local_sizes,
 * i.e. one entry per predefined datatype — confirm.
 */
OPAL_DECLSPEC size_t
opal_datatype_compute_remote_size(const opal_datatype_t *pData,
const size_t *sizes);
/**
 * Compute the span in memory of `count` datatypes.
 *
 * This helps with temporary memory allocations for receiving already typed
 * data (such as those used for reduce operations). The span is the distance
 * between the minimum and the maximum byte in the memory layout of `count`
 * datatypes, or in other terms the memory needed to hold `count` times the
 * datatype without the gap at the beginning and at the end.
 *
 * @param pData  datatype to query; dereferenced unconditionally
 * @param count  number of repetitions of the datatype
 * @param gap    [out] receives the number of bytes of the gap at the
 *               beginning (pData->true_lb), or 0 when the datatype size or
 *               the count is 0
 * @return the memory span of `count` repetitions of the datatype, or 0 when
 *         the datatype size or the count is 0
 */
static inline ptrdiff_t opal_datatype_span(const opal_datatype_t *pData, size_t count,
                                           ptrdiff_t *gap)
{
    ptrdiff_t span = 0;

    if (OPAL_UNLIKELY(0 == pData->size) || (0 == count)) {
        /* Nothing to lay out: no gap and no span. */
        *gap = 0;
    } else {
        *gap = pData->true_lb;

        const ptrdiff_t stride = pData->ub - pData->lb;
        const ptrdiff_t true_length = pData->true_ub - pData->true_lb;

        /* One full true extent for the last element plus one extent for each
         * of the preceding (count - 1) elements. The expression mixes
         * ptrdiff_t with size_t, so (where size_t has at least the rank of
         * ptrdiff_t) it is evaluated in size_t and converted back on
         * assignment. */
        span = true_length + stride * (count - 1);
    }
    return span;
}
#if OPAL_ENABLE_DEBUG
/*
 * Set a breakpoint on this function in your favorite debugger
 * to make it stop on all pack and unpack errors.
 *
 * Only declared when OPAL_ENABLE_DEBUG evaluates to true.
 */
OPAL_DECLSPEC int opal_datatype_safeguard_pointer_debug_breakpoint(const void *actual_ptr,
int length,
const void *initial_ptr,
const opal_datatype_t *pData,
int count);
#endif /* OPAL_ENABLE_DEBUG */
END_C_DECLS
#endif /* OPAL_DATATYPE_H_HAS_BEEN_INCLUDED */