@@ -179,18 +179,18 @@ class committed_descriptor {
179
179
template <typename Scalar1, domain Domain1, direction Dir, detail::layout LayoutIn, detail::layout LayoutOut,
180
180
Idx SubgroupSize, typename TIn>
181
181
friend std::vector<sycl::event> detail::compute_level (
182
- const typename committed_descriptor<Scalar1, Domain1>::kernel_data_struct& kd_struct, TIn input, Scalar * output,
183
- const Scalar * twiddles_ptr, const IdxGlobal* factors_triple, Scalar scale_factor,
182
+ const typename committed_descriptor<Scalar1, Domain1>::kernel_data_struct& kd_struct, TIn input, Scalar1 * output,
183
+ const Scalar1 * twiddles_ptr, const IdxGlobal* factors_triple, Scalar1 scale_factor,
184
184
IdxGlobal intermediate_twiddle_offset, IdxGlobal subimpl_twiddle_offset, IdxGlobal input_global_offset,
185
185
IdxGlobal committed_size, Idx num_batches_in_l2, IdxGlobal n_transforms, IdxGlobal batch_start, Idx factor_id,
186
186
Idx total_factors, const std::vector<sycl::event>& dependencies, sycl::queue& queue);
187
187
188
188
template <typename Scalar1, domain Domain1, typename TOut>
189
189
friend sycl::event detail::transpose_level (
190
- const typename committed_descriptor<Scalar1, Domain1>::kernel_data_struct& kd_struct, const Scalar * input,
190
+ const typename committed_descriptor<Scalar1, Domain1>::kernel_data_struct& kd_struct, const Scalar1 * input,
191
191
TOut output, const IdxGlobal* factors_triple, IdxGlobal committed_size, Idx num_batches_in_l2,
192
192
IdxGlobal n_transforms, IdxGlobal batch_start, Idx factor_num, Idx total_factors, IdxGlobal output_offset,
193
- sycl::queue& queue, std::shared_ptr<Scalar >& ptr1, std::shared_ptr<Scalar >& ptr2,
193
+ sycl::queue& queue, std::shared_ptr<Scalar1 >& ptr1, std::shared_ptr<Scalar1 >& ptr2,
194
194
const std::vector<sycl::event>& events);
195
195
196
196
descriptor<Scalar, Domain> params;
0 commit comments