Intel® DPC++ Compatibility Tool Developer Guide and Reference
ID
768918
Date
6/24/2024
Public
A newer version of this document is available. Customers should click here to go to the newest version.
DPCT1000
DPCT1001
DPCT1002
DPCT1003
DPCT1004
DPCT1005
DPCT1006
DPCT1007
DPCT1008
DPCT1009
DPCT1010
DPCT1011
DPCT1012
DPCT1013
DPCT1014
DPCT1015
DPCT1016
DPCT1017
DPCT1018
DPCT1019
DPCT1020
DPCT1021
DPCT1022
DPCT1023
DPCT1024
DPCT1025
DPCT1026
DPCT1027
DPCT1028
DPCT1029
DPCT1030
DPCT1031
DPCT1032
DPCT1033
DPCT1034
DPCT1035
DPCT1036
DPCT1037
DPCT1038
DPCT1039
DPCT1040
DPCT1041
DPCT1042
DPCT1043
DPCT1044
DPCT1045
DPCT1046
DPCT1047
DPCT1048
DPCT1049
DPCT1050
DPCT1051
DPCT1052
DPCT1053
DPCT1054
DPCT1055
DPCT1056
DPCT1057
DPCT1058
DPCT1059
DPCT1060
DPCT1061
DPCT1062
DPCT1063
DPCT1064
DPCT1065
DPCT1066
DPCT1067
DPCT1068
DPCT1069
DPCT1070
DPCT1071
DPCT1072
DPCT1073
DPCT1074
DPCT1075
DPCT1076
DPCT1077
DPCT1078
DPCT1079
DPCT1080
DPCT1081
DPCT1082
DPCT1083
DPCT1084
Message
Detailed Help
Suggestions to Fix
DPCT1085
DPCT1086
DPCT1087
DPCT1088
DPCT1089
DPCT1090
DPCT1091
DPCT1092
DPCT1093
DPCT1094
DPCT1095
DPCT1096
DPCT1097
DPCT1098
DPCT1099
DPCT1100
DPCT1101
DPCT1102
DPCT1103
DPCT1104
DPCT1105
DPCT1106
DPCT1107
DPCT1108
DPCT1109
DPCT1110
DPCT1111
DPCT1112
DPCT1113
DPCT1114
DPCT1115
DPCT1116
DPCT1117
DPCT1118
DPCT1119
DPCT1120
DPCT1121
DPCT1122
DPCT1123
DPCT1124
DPCT1125
DPCT1126
DPCT1127
DPCT1128
DPCT1129
DPCT2001
DPCT3000
DPCT1084
Message
The function call <function name> has multiple migration results in different template instantiations that could not be unified. You may need to adjust the code.
Detailed Help
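The Intel® DPC++ Compatibility Tool could not produce a single migrated form of the function call that is correct for every template instantiation in which the call appears, so the migrated code is not correct for all instantiations. Modify the code manually.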
The following example shows original code, migrated code, and the manual changes made to correct the migrated code.
For example, this original CUDA* code:
__constant__ int4 example_i[32];
__constant__ float4 example_f[32];
struct example_int {
__device__ int4 foo(int idx) const { return example_i[idx]; }
};
struct example_float {
__device__ float4 foo(int idx) const { return example_f[idx]; }
};
template <typename T> __global__ void example_kernel() {
T example_v;
int idx = blockIdx.x * blockDim.x + threadIdx.x;
float j = example_v.foo(idx).x;
}
void foo() {
example_kernel<example_int><<<1, 1>>>();
example_kernel<example_float><<<1, 1>>>();
}
results in the following migrated SYCL* code:
static dpct::constant_memory<sycl::int4, 1> example_i(32);
static dpct::constant_memory<sycl::float4, 1> example_f(32);
struct example_int {
sycl::int4 foo(int idx, sycl::int4 const *example_i) const {
return example_i[idx];
}
};
struct example_float {
sycl::float4 foo(int idx, sycl::float4 const *example_f) const {
return example_f[idx];
}
};
template <typename T> void example_kernel(const sycl::nd_item<3> &item_ct1,
sycl::float4 const *example_f) {
T example_v;
int idx = item_ct1.get_group(2) * item_ct1.get_local_range(2) +
item_ct1.get_local_id(2);
/*
DPCT1084:0: The function call "example_int::foo" has multiple migration
results in different template instantiations that could not be unified. You
may need to adjust the code.
*/
float j = example_v.foo(idx).x();
}
void foo() {
dpct::device_ext &dev_ct1 = dpct::get_current_device();
sycl::queue &q_ct1 = dev_ct1.in_order_queue();
q_ct1.submit([&](sycl::handler &cgh) {
example_f.init();
auto example_f_ptr_ct1 = example_f.get_ptr();
cgh.parallel_for(
sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
[=](sycl::nd_item<3> item_ct1) {
example_kernel<example_int>(item_ct1, example_f_ptr_ct1);
});
});
q_ct1.submit([&](sycl::handler &cgh) {
example_f.init();
auto example_f_ptr_ct1 = example_f.get_ptr();
cgh.parallel_for(
sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
[=](sycl::nd_item<3> item_ct1) {
example_kernel<example_float>(item_ct1, example_f_ptr_ct1);
});
});
}
which is manually adjusted to:
static dpct::constant_memory<sycl::int4, 1> example_i(32);
static dpct::constant_memory<sycl::float4, 1> example_f(32);
struct example_int {
typedef sycl::int4 data_type;
sycl::int4 foo(int idx, sycl::int4 const *example_i) const {
return example_i[idx];
}
};
struct example_float {
typedef sycl::float4 data_type;
sycl::float4 foo(int idx, sycl::float4 const *example_f) const {
return example_f[idx];
}
};
template <typename T> void example_kernel(const sycl::nd_item<3> &item_ct1,
typename T::data_type const *example) {
T example_v;
int idx = item_ct1.get_group(2) * item_ct1.get_local_range(2) +
item_ct1.get_local_id(2);
float j = example_v.foo(idx, example).x();
}
void foo() {
dpct::device_ext &dev_ct1 = dpct::get_current_device();
sycl::queue &q_ct1 = dev_ct1.in_order_queue();
q_ct1.submit([&](sycl::handler &cgh) {
example_i.init();
auto example_i_ptr_ct1 = example_i.get_ptr();
cgh.parallel_for(
sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
[=](sycl::nd_item<3> item_ct1) {
example_kernel<example_int>(item_ct1, example_i_ptr_ct1);
});
});
q_ct1.submit([&](sycl::handler &cgh) {
example_f.init();
auto example_f_ptr_ct1 = example_f.get_ptr();
cgh.parallel_for(
sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
[=](sycl::nd_item<3> item_ct1) {
example_kernel<example_float>(item_ct1, example_f_ptr_ct1);
});
});
}
Suggestions to Fix
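The code requires manual adjustment. Rewrite the flagged call so that it is valid for every template instantiation. In the example above, each struct exposes a data_type typedef, the kernel takes a typename T::data_type const * parameter that it forwards to foo, and each kernel launch passes the pointer to the matching constant-memory object (example_i or example_f).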