• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

daisytuner / sdfglib / 21478974613

29 Jan 2026 12:55PM UTC coverage: 65.778% (-0.07%) from 65.843%
21478974613

push

github

web-flow
Merge pull request #485 from daisytuner/npbench-cavity-flow

Adds support for npbench's cavity_flow

59 of 130 new or added lines in 6 files covered. (45.38%)

1 existing line in 1 file now uncovered.

22446 of 34124 relevant lines covered (65.78%)

382.63 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

35.44
/sdfg/src/codegen/language_extensions/cuda_language_extension.cpp
1
#include "sdfg/codegen/language_extensions/cuda_language_extension.h"
2

3
#include "sdfg/codegen/language_extensions/cpp_language_extension.h"
4
#include "sdfg/codegen/utils.h"
5
#include "sdfg/data_flow/library_node.h"
6
#include "sdfg/data_flow/tasklet.h"
7

8
namespace sdfg {
9
namespace codegen {
10

11
std::string CUDALanguageExtension::primitive_type(const types::PrimitiveType prim_type) {
41✔
12
    switch (prim_type) {
41✔
13
        case types::PrimitiveType::Void:
1✔
14
            return "void";
1✔
15
        case types::PrimitiveType::Bool:
1✔
16
            return "bool";
1✔
17
        case types::PrimitiveType::Int8:
1✔
18
            return "signed char";
1✔
19
        case types::PrimitiveType::Int16:
1✔
20
            return "short";
1✔
21
        case types::PrimitiveType::Int32:
11✔
22
            return "int";
11✔
23
        case types::PrimitiveType::Int64:
1✔
24
            return "long long";
1✔
25
        case types::PrimitiveType::Int128:
×
26
            return "__int128";
×
27
        case types::PrimitiveType::UInt8:
3✔
28
            return "char";
3✔
29
        case types::PrimitiveType::UInt16:
1✔
30
            return "unsigned short";
1✔
31
        case types::PrimitiveType::UInt32:
1✔
32
            return "unsigned int";
1✔
33
        case types::PrimitiveType::UInt64:
1✔
34
            return "unsigned long long";
1✔
35
        case types::PrimitiveType::UInt128:
×
36
            return "unsigned __int128";
×
37
        case types::PrimitiveType::Half:
×
38
            return "__fp16";
×
39
        case types::PrimitiveType::BFloat:
×
40
            return "__bf16";
×
41
        case types::PrimitiveType::Float:
18✔
42
            return "float";
18✔
43
        case types::PrimitiveType::Double:
1✔
44
            return "double";
1✔
45
        case types::PrimitiveType::X86_FP80:
×
46
            return "long double";
×
47
        case types::PrimitiveType::FP128:
×
48
            return "__float128";
×
49
        case types::PrimitiveType::PPC_FP128:
×
50
            return "__float128";
×
51
    }
41✔
52

53
    throw std::runtime_error("Unknown primitive type");
×
54
};
41✔
55

56
std::string CUDALanguageExtension::
57
    declaration(const std::string& name, const types::IType& type, bool use_initializer, bool use_alignment) {
47✔
58
    std::stringstream val;
47✔
59

60
    if (auto scalar_type = dynamic_cast<const types::Scalar*>(&type)) {
47✔
61
        if (scalar_type->storage_type().is_nv_shared()) {
29✔
62
            val << "__shared__ ";
×
63
        } else if (scalar_type->storage_type().is_nv_constant()) {
29✔
64
            val << "__constant__ ";
×
65
        }
×
66
        val << primitive_type(scalar_type->primitive_type());
29✔
67
        val << " ";
29✔
68
        val << name;
29✔
69
    } else if (auto array_type = dynamic_cast<const types::Array*>(&type)) {
29✔
70
        if (array_type->storage_type().is_nv_shared()) {
3✔
71
            val << "__shared__ ";
×
72
        }
×
73
        auto& element_type = array_type->element_type();
3✔
74
        val << declaration(name + "[" + this->expression(array_type->num_elements()) + "]", element_type);
3✔
75
    } else if (auto pointer_type = dynamic_cast<const types::Pointer*>(&type)) {
15✔
76
        if (pointer_type->has_pointee_type()) {
12✔
77
            const types::IType& pointee = pointer_type->pointee_type();
11✔
78

79
            const bool pointee_is_function_or_array = dynamic_cast<const types::Function*>(&pointee) ||
11✔
80
                                                      dynamic_cast<const types::Array*>(&pointee);
11✔
81

82
            // Parenthesise *only* when it is needed to bind tighter than [] or ()
83
            std::string decorated = pointee_is_function_or_array ? "(*" + name + ")" : "*" + name;
11✔
84

85
            val << declaration(decorated, pointee);
11✔
86
        } else {
11✔
87
            val << "void*";
1✔
88
            val << " " << name;
1✔
89
        }
1✔
90
    } else if (auto ref_type = dynamic_cast<const Reference*>(&type)) {
12✔
91
        val << declaration("&" + name, ref_type->reference_type());
×
92
    } else if (auto structure_type = dynamic_cast<const types::Structure*>(&type)) {
3✔
93
        if (structure_type->storage_type().is_nv_shared()) {
3✔
94
            val << "__shared__ ";
×
95
        } else if (structure_type->storage_type().is_nv_constant()) {
3✔
96
            val << "__constant__ ";
×
97
        }
×
98
        val << structure_type->name();
3✔
99
        val << " ";
3✔
100
        val << name;
3✔
101
    } else if (auto function_type = dynamic_cast<const types::Function*>(&type)) {
3✔
102
        std::stringstream params;
×
103
        for (size_t i = 0; i < function_type->num_params(); ++i) {
×
104
            params << declaration("", function_type->param_type(symbolic::integer(i)));
×
105
            if (i + 1 < function_type->num_params()) params << ", ";
×
106
        }
×
107
        if (function_type->is_var_arg()) {
×
108
            if (function_type->num_params() > 0) {
×
109
                params << ", ";
×
110
            }
×
111
            params << "...";
×
112
        }
×
113

114
        const std::string fun_name = name + "(" + params.str() + ")";
×
115
        val << declaration(fun_name, function_type->return_type());
×
116
    } else {
×
117
        throw std::runtime_error("Unknown declaration type");
×
118
    }
×
119

120
    if (use_alignment && type.alignment() > 0) {
47✔
121
        val << " __attribute__((aligned(" << type.alignment() << ")))";
×
122
    }
×
123

124
    if (use_initializer && !type.initializer().empty()) {
47✔
125
        val << " = " << type.initializer();
×
126
    }
×
127

128
    return val.str();
47✔
129
};
47✔
130

131
std::string CUDALanguageExtension::type_cast(const std::string& name, const types::IType& type) {
5✔
132
    std::stringstream val;
5✔
133

134
    val << "reinterpret_cast";
5✔
135
    val << "<";
5✔
136
    val << declaration("", type);
5✔
137
    val << ">";
5✔
138
    val << "(" << name << ")";
5✔
139

140
    return val.str();
5✔
141
};
5✔
142

143
std::string CUDALanguageExtension::subset(const types::IType& type, const data_flow::Subset& sub) {
15✔
144
    if (sub.empty()) {
15✔
145
        return "";
9✔
146
    }
9✔
147

148
    if (dynamic_cast<const types::Scalar*>(&type)) {
6✔
149
        return "";
×
150
    } else if (auto array_type = dynamic_cast<const types::Array*>(&type)) {
6✔
151
        std::string subset_str = "[" + this->expression(sub.at(0)) + "]";
1✔
152

153
        if (sub.size() > 1) {
1✔
154
            data_flow::Subset element_subset(sub.begin() + 1, sub.end());
×
155
            auto& element_type = array_type->element_type();
×
156
            return subset_str + subset(element_type, element_subset);
×
157
        } else {
1✔
158
            return subset_str;
1✔
159
        }
1✔
160
    } else if (auto pointer_type = dynamic_cast<const types::Pointer*>(&type)) {
5✔
161
        std::string subset_str = "[" + this->expression(sub.at(0)) + "]";
4✔
162

163
        data_flow::Subset element_subset(sub.begin() + 1, sub.end());
4✔
164
        auto& pointee_type = pointer_type->pointee_type();
4✔
165
        return subset_str + subset(pointee_type, element_subset);
4✔
166
    } else if (auto structure_type = dynamic_cast<const types::Structure*>(&type)) {
4✔
167
        auto& definition = this->function_.structure(structure_type->name());
1✔
168

169
        std::string subset_str = ".member_" + this->expression(sub.at(0));
1✔
170
        if (sub.size() > 1) {
1✔
171
            auto member = SymEngine::rcp_dynamic_cast<const SymEngine::Integer>(sub.at(0));
×
172
            auto& member_type = definition.member_type(member);
×
173
            data_flow::Subset element_subset(sub.begin() + 1, sub.end());
×
174
            return subset_str + subset(member_type, element_subset);
×
175
        } else {
1✔
176
            return subset_str;
1✔
177
        }
1✔
178
    }
1✔
179

180
    throw std::invalid_argument("Invalid subset type");
×
181
};
6✔
182

183
std::string CUDALanguageExtension::expression(const symbolic::Expression expr) {
17✔
184
    CPPSymbolicPrinter printer(this->function_, this->external_prefix_);
17✔
185
    return printer.apply(expr);
17✔
186
};
17✔
187

188
std::string CUDALanguageExtension::access_node(const data_flow::AccessNode& node) {
8✔
189
    if (dynamic_cast<const data_flow::ConstantNode*>(&node)) {
8✔
190
        std::string name = node.data();
4✔
191
        if (symbolic::is_nullptr(symbolic::symbol(name))) {
4✔
192
            return "nullptr";
×
193
        }
×
194
        return name;
4✔
195
    } else {
4✔
196
        std::string name = node.data();
4✔
197
        if (this->function_.is_external(name)) {
4✔
198
            return "(&" + name + ")";
×
199
        }
×
200
        return name;
4✔
201
    }
4✔
202
};
8✔
203

204
std::string CUDALanguageExtension::tasklet(const data_flow::Tasklet& tasklet) {
4✔
205
    switch (tasklet.code()) {
4✔
206
        case data_flow::TaskletCode::assign:
4✔
207
            return tasklet.inputs().at(0);
4✔
208
        case data_flow::TaskletCode::fp_neg:
×
209
            return "-" + tasklet.inputs().at(0);
×
210
        case data_flow::TaskletCode::fp_add:
×
211
            return tasklet.inputs().at(0) + " + " + tasklet.inputs().at(1);
×
212
        case data_flow::TaskletCode::fp_sub:
×
213
            return tasklet.inputs().at(0) + " - " + tasklet.inputs().at(1);
×
214
        case data_flow::TaskletCode::fp_mul:
×
215
            return tasklet.inputs().at(0) + " * " + tasklet.inputs().at(1);
×
216
        case data_flow::TaskletCode::fp_div:
×
217
            return tasklet.inputs().at(0) + " / " + tasklet.inputs().at(1);
×
218
        case data_flow::TaskletCode::fp_rem:
×
NEW
219
            return "fmod(" + tasklet.inputs().at(0) + ", " + tasklet.inputs().at(1) + ")";
×
220
        case data_flow::TaskletCode::fp_fma:
×
221
            return tasklet.inputs().at(0) + " * " + tasklet.inputs().at(1) + " + " + tasklet.inputs().at(2);
×
222
        case data_flow::TaskletCode::fp_oeq:
×
223
            return tasklet.inputs().at(0) + " == " + tasklet.inputs().at(1);
×
224
        case data_flow::TaskletCode::fp_one:
×
225
            return tasklet.inputs().at(0) + " != " + tasklet.inputs().at(1);
×
226
        case data_flow::TaskletCode::fp_ogt:
×
227
            return tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1);
×
228
        case data_flow::TaskletCode::fp_oge:
×
229
            return tasklet.inputs().at(0) + " >= " + tasklet.inputs().at(1);
×
230
        case data_flow::TaskletCode::fp_olt:
×
231
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1);
×
232
        case data_flow::TaskletCode::fp_ole:
×
233
            return tasklet.inputs().at(0) + " <= " + tasklet.inputs().at(1);
×
234
        case data_flow::TaskletCode::fp_ord:
×
235
            return "std::isnan(" + tasklet.inputs().at(0) + ") && std::isnan(" + tasklet.inputs().at(1) + ")";
×
236
        case data_flow::TaskletCode::fp_ueq:
×
237
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
238
                   tasklet.inputs().at(0) + " == " + tasklet.inputs().at(1);
×
239
        case data_flow::TaskletCode::fp_une:
×
240
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
241
                   tasklet.inputs().at(0) + " != " + tasklet.inputs().at(1);
×
242
        case data_flow::TaskletCode::fp_ugt:
×
243
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
244
                   tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1);
×
245
        case data_flow::TaskletCode::fp_uge:
×
246
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
247
                   tasklet.inputs().at(0) + " >= " + tasklet.inputs().at(1);
×
248
        case data_flow::TaskletCode::fp_ult:
×
249
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
250
                   tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1);
×
251
        case data_flow::TaskletCode::fp_ule:
×
252
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")" + " || " +
×
253
                   tasklet.inputs().at(0) + " <= " + tasklet.inputs().at(1);
×
254
        case data_flow::TaskletCode::fp_uno:
×
255
            return "std::isnan(" + tasklet.inputs().at(0) + ") || std::isnan(" + tasklet.inputs().at(1) + ")";
×
256
        case data_flow::TaskletCode::int_add:
×
257
            return tasklet.inputs().at(0) + " + " + tasklet.inputs().at(1);
×
258
        case data_flow::TaskletCode::int_sub:
×
259
            return tasklet.inputs().at(0) + " - " + tasklet.inputs().at(1);
×
260
        case data_flow::TaskletCode::int_mul:
×
261
            return tasklet.inputs().at(0) + " * " + tasklet.inputs().at(1);
×
262
        case data_flow::TaskletCode::int_sdiv:
×
263
            return tasklet.inputs().at(0) + " / " + tasklet.inputs().at(1);
×
264
        case data_flow::TaskletCode::int_srem:
×
265
            return tasklet.inputs().at(0) + " % " + tasklet.inputs().at(1);
×
266
        case data_flow::TaskletCode::int_udiv:
×
267
            return tasklet.inputs().at(0) + " / " + tasklet.inputs().at(1);
×
268
        case data_flow::TaskletCode::int_urem:
×
269
            return tasklet.inputs().at(0) + " % " + tasklet.inputs().at(1);
×
270
        case data_flow::TaskletCode::int_and:
×
271
            return tasklet.inputs().at(0) + " & " + tasklet.inputs().at(1);
×
272
        case data_flow::TaskletCode::int_or:
×
273
            return tasklet.inputs().at(0) + " | " + tasklet.inputs().at(1);
×
274
        case data_flow::TaskletCode::int_xor:
×
275
            return tasklet.inputs().at(0) + " ^ " + tasklet.inputs().at(1);
×
276
        case data_flow::TaskletCode::int_shl:
×
277
            return tasklet.inputs().at(0) + " << " + tasklet.inputs().at(1);
×
278
        case data_flow::TaskletCode::int_lshr:
×
279
            return tasklet.inputs().at(0) + " >> " + tasklet.inputs().at(1);
×
280
        case data_flow::TaskletCode::int_ashr:
×
281
            return tasklet.inputs().at(0) + " >> " + tasklet.inputs().at(1);
×
282
        case data_flow::TaskletCode::int_smin:
×
283
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1) + " ? " + tasklet.inputs().at(0) + " : " +
×
284
                   tasklet.inputs().at(1);
×
285
        case data_flow::TaskletCode::int_smax:
×
286
            return tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1) + " ? " + tasklet.inputs().at(0) + " : " +
×
287
                   tasklet.inputs().at(1);
×
288
        case data_flow::TaskletCode::int_scmp:
×
289
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1) + " ? -1 : (" + tasklet.inputs().at(0) +
×
290
                   " > " + tasklet.inputs().at(1) + " ? 1 : 0)";
×
291
        case data_flow::TaskletCode::int_umin:
×
292
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1) + " ? " + tasklet.inputs().at(0) + " : " +
×
293
                   tasklet.inputs().at(1);
×
294
        case data_flow::TaskletCode::int_umax:
×
295
            return tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1) + " ? " + tasklet.inputs().at(0) + " : " +
×
296
                   tasklet.inputs().at(1);
×
297
        case data_flow::TaskletCode::int_ucmp:
×
298
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1) + " ? -1 : (" + tasklet.inputs().at(0) +
×
299
                   " > " + tasklet.inputs().at(1) + " ? 1 : 0)";
×
300
        case data_flow::TaskletCode::int_abs:
×
301
            return "(" + tasklet.inputs().at(0) + " < 0 ? -" + tasklet.inputs().at(0) + " : " + tasklet.inputs().at(0) +
×
302
                   ")";
×
303
        case data_flow::TaskletCode::int_eq:
×
304
            return tasklet.inputs().at(0) + " == " + tasklet.inputs().at(1);
×
305
        case data_flow::TaskletCode::int_ne:
×
306
            return tasklet.inputs().at(0) + " != " + tasklet.inputs().at(1);
×
307
        case data_flow::TaskletCode::int_sgt:
×
308
            return tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1);
×
309
        case data_flow::TaskletCode::int_sge:
×
310
            return tasklet.inputs().at(0) + " >= " + tasklet.inputs().at(1);
×
311
        case data_flow::TaskletCode::int_slt:
×
312
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1);
×
313
        case data_flow::TaskletCode::int_sle:
×
314
            return tasklet.inputs().at(0) + " <= " + tasklet.inputs().at(1);
×
315
        case data_flow::TaskletCode::int_ugt:
×
316
            return tasklet.inputs().at(0) + " > " + tasklet.inputs().at(1);
×
317
        case data_flow::TaskletCode::int_uge:
×
318
            return tasklet.inputs().at(0) + " >= " + tasklet.inputs().at(1);
×
319
        case data_flow::TaskletCode::int_ult:
×
320
            return tasklet.inputs().at(0) + " < " + tasklet.inputs().at(1);
×
321
        case data_flow::TaskletCode::int_ule:
×
322
            return tasklet.inputs().at(0) + " <= " + tasklet.inputs().at(1);
×
323
    };
4✔
324
    throw std::invalid_argument("Invalid tasklet code");
×
325
};
4✔
326

327
std::string CUDALanguageExtension::zero(const types::PrimitiveType prim_type) {
×
328
    switch (prim_type) {
×
329
        case types::Void:
×
330
            throw InvalidSDFGException("No zero for void type possible");
×
331
        case types::Bool:
×
332
            return "false";
×
333
        case types::Int8:
×
334
            return "0";
×
335
        case types::Int16:
×
336
            return "0";
×
337
        case types::Int32:
×
338
            return "0";
×
339
        case types::Int64:
×
340
            return "0ll";
×
341
        case types::Int128:
×
342
            return "0";
×
343
        case types::UInt8:
×
344
            return "0u";
×
345
        case types::UInt16:
×
346
            return "0u";
×
347
        case types::UInt32:
×
348
            return "0u";
×
349
        case types::UInt64:
×
350
            return "0ull";
×
351
        case types::UInt128:
×
352
            return "0";
×
353
        case types::Half:
×
354
            return "CUDART_ZERO_FP16";
×
355
        case types::BFloat:
×
356
            return "CUDART_ZERO_BF16";
×
357
        case types::Float:
×
358
            return "0.0f";
×
359
        case types::Double:
×
360
            return "0.0";
×
361
        case types::X86_FP80:
×
362
            return "0.0l";
×
363
        case types::FP128:
×
364
            return "0.0";
×
365
        case types::PPC_FP128:
×
366
            return "0.0";
×
367
    }
×
368
}
×
369

370
} // namespace codegen
371
} // namespace sdfg
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc