@@ -120,8 +120,8 @@ template <typename InputTorus>
120120void cuda_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128 (
121121 void *stream, uint32_t gpu_index, __uint128_t *lwe_array_out,
122122 InputTorus const *lwe_output_indexes, __uint128_t const *lut_vector,
123- InputTorus const *lut_vector_indexes , InputTorus const *lwe_array_in ,
124- InputTorus const *lwe_input_indexes, __uint128_t const *bootstrapping_key,
123+ InputTorus const *lwe_array_in , InputTorus const *lwe_input_indexes ,
124+ __uint128_t const *bootstrapping_key,
125125 pbs_buffer_128<InputTorus, MULTI_BIT> *pbs_buffer, uint32_t lwe_dimension,
126126 uint32_t glwe_dimension, uint32_t polynomial_size, uint32_t grouping_factor,
127127 uint32_t base_log, uint32_t level_count, uint32_t num_samples,
@@ -131,45 +131,45 @@ void cuda_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128(
131131 case 256 :
132132 host_multi_bit_programmable_bootstrap_128<InputTorus, AmortizedDegree<256 >>(
133133 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
134- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
135- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
136- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
137- num_samples, num_many_lut, lut_stride);
134+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
135+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
136+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
137+ num_many_lut, lut_stride);
138138 break ;
139139 case 512 :
140140 host_multi_bit_programmable_bootstrap_128<InputTorus, AmortizedDegree<512 >>(
141141 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
142- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
143- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
144- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
145- num_samples, num_many_lut, lut_stride);
142+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
143+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
144+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
145+ num_many_lut, lut_stride);
146146 break ;
147147 case 1024 :
148148 host_multi_bit_programmable_bootstrap_128<InputTorus,
149149 AmortizedDegree<1024 >>(
150150 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
151- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
152- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
153- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
154- num_samples, num_many_lut, lut_stride);
151+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
152+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
153+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
154+ num_many_lut, lut_stride);
155155 break ;
156156 case 2048 :
157157 host_multi_bit_programmable_bootstrap_128<InputTorus,
158158 AmortizedDegree<2048 >>(
159159 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
160- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
161- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
162- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
163- num_samples, num_many_lut, lut_stride);
160+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
161+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
162+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
163+ num_many_lut, lut_stride);
164164 break ;
165165 case 4096 :
166166 host_multi_bit_programmable_bootstrap_128<InputTorus,
167167 AmortizedDegree<4096 >>(
168168 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
169- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
170- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
171- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
172- num_samples, num_many_lut, lut_stride);
169+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
170+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
171+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
172+ num_many_lut, lut_stride);
173173 break ;
174174 default :
175175 PANIC (" Cuda error (multi-bit PBS): unsupported polynomial size. Supported "
@@ -182,8 +182,8 @@ template <typename InputTorus>
182182void cuda_cg_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128 (
183183 void *stream, uint32_t gpu_index, __uint128_t *lwe_array_out,
184184 InputTorus const *lwe_output_indexes, __uint128_t const *lut_vector,
185- InputTorus const *lut_vector_indexes , InputTorus const *lwe_array_in ,
186- InputTorus const *lwe_input_indexes, __uint128_t const *bootstrapping_key,
185+ InputTorus const *lwe_array_in , InputTorus const *lwe_input_indexes ,
186+ __uint128_t const *bootstrapping_key,
187187 pbs_buffer_128<InputTorus, MULTI_BIT> *pbs_buffer, uint32_t lwe_dimension,
188188 uint32_t glwe_dimension, uint32_t polynomial_size, uint32_t grouping_factor,
189189 uint32_t base_log, uint32_t level_count, uint32_t num_samples,
@@ -194,46 +194,46 @@ void cuda_cg_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128(
194194 host_cg_multi_bit_programmable_bootstrap_128<InputTorus,
195195 AmortizedDegree<256 >>(
196196 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
197- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
198- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
199- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
200- num_samples, num_many_lut, lut_stride);
197+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
198+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
199+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
200+ num_many_lut, lut_stride);
201201 break ;
202202 case 512 :
203203 host_cg_multi_bit_programmable_bootstrap_128<InputTorus,
204204 AmortizedDegree<512 >>(
205205 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
206- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
207- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
208- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
209- num_samples, num_many_lut, lut_stride);
206+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
207+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
208+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
209+ num_many_lut, lut_stride);
210210 break ;
211211 case 1024 :
212212 host_cg_multi_bit_programmable_bootstrap_128<InputTorus,
213213 AmortizedDegree<1024 >>(
214214 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
215- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
216- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
217- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
218- num_samples, num_many_lut, lut_stride);
215+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
216+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
217+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
218+ num_many_lut, lut_stride);
219219 break ;
220220 case 2048 :
221221 host_cg_multi_bit_programmable_bootstrap_128<InputTorus,
222222 AmortizedDegree<2048 >>(
223223 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
224- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
225- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
226- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
227- num_samples, num_many_lut, lut_stride);
224+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
225+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
226+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
227+ num_many_lut, lut_stride);
228228 break ;
229229 case 4096 :
230230 host_cg_multi_bit_programmable_bootstrap_128<InputTorus,
231231 AmortizedDegree<4096 >>(
232232 static_cast <cudaStream_t>(stream), gpu_index, lwe_array_out,
233- lwe_output_indexes, lut_vector, lut_vector_indexes, lwe_array_in ,
234- lwe_input_indexes, bootstrapping_key, pbs_buffer, glwe_dimension,
235- lwe_dimension, polynomial_size, grouping_factor, base_log, level_count,
236- num_samples, num_many_lut, lut_stride);
233+ lwe_output_indexes, lut_vector, lwe_array_in, lwe_input_indexes ,
234+ bootstrapping_key, pbs_buffer, glwe_dimension, lwe_dimension ,
235+ polynomial_size, grouping_factor, base_log, level_count, num_samples ,
236+ num_many_lut, lut_stride);
237237 break ;
238238 default :
239239 PANIC (" Cuda error (multi-bit PBS): unsupported polynomial size. Supported "
@@ -245,12 +245,11 @@ void cuda_cg_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128(
245245void cuda_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128 (
246246 void *stream, uint32_t gpu_index, void *lwe_array_out,
247247 void const *lwe_output_indexes, void const *lut_vector,
248- void const *lut_vector_indexes, void const *lwe_array_in,
249- void const *lwe_input_indexes, void const *bootstrapping_key,
250- int8_t *mem_ptr, uint32_t lwe_dimension, uint32_t glwe_dimension,
251- uint32_t polynomial_size, uint32_t grouping_factor, uint32_t base_log,
252- uint32_t level_count, uint32_t num_samples, uint32_t num_many_lut,
253- uint32_t lut_stride) {
248+ void const *lwe_array_in, void const *lwe_input_indexes,
249+ void const *bootstrapping_key, int8_t *mem_ptr, uint32_t lwe_dimension,
250+ uint32_t glwe_dimension, uint32_t polynomial_size, uint32_t grouping_factor,
251+ uint32_t base_log, uint32_t level_count, uint32_t num_samples,
252+ uint32_t num_many_lut, uint32_t lut_stride) {
254253
255254 if (base_log > 64 )
256255 PANIC (" Cuda error (multi-bit PBS): base log should be <= 64" )
@@ -263,7 +262,6 @@ void cuda_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128(
263262 uint64_t >(stream, gpu_index, static_cast <__uint128_t *>(lwe_array_out),
264263 static_cast <const uint64_t *>(lwe_output_indexes),
265264 static_cast <const __uint128_t *>(lut_vector),
266- static_cast <const uint64_t *>(lut_vector_indexes),
267265 static_cast <const uint64_t *>(lwe_array_in),
268266 static_cast <const uint64_t *>(lwe_input_indexes),
269267 static_cast <const __uint128_t *>(bootstrapping_key), buffer,
@@ -276,7 +274,6 @@ void cuda_multi_bit_programmable_bootstrap_lwe_ciphertext_vector_128(
276274 stream, gpu_index, static_cast <__uint128_t *>(lwe_array_out),
277275 static_cast <const uint64_t *>(lwe_output_indexes),
278276 static_cast <const __uint128_t *>(lut_vector),
279- static_cast <const uint64_t *>(lut_vector_indexes),
280277 static_cast <const uint64_t *>(lwe_array_in),
281278 static_cast <const uint64_t *>(lwe_input_indexes),
282279 static_cast <const __uint128_t *>(bootstrapping_key), buffer,
0 commit comments