zama-ai
diff --git a/‎tfhe-benchmark/benches/boolean/bench.rs‎
Lines changed: 7 additions & 0 deletions b/‎tfhe-benchmark/benches/boolean/bench.rs‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎tfhe-benchmark/benches/core_crypto/ks_bench.rs‎
Lines changed: 8 additions & 0 deletions b/‎tfhe-benchmark/benches/core_crypto/ks_bench.rs‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎tfhe-benchmark/benches/core_crypto/ks_pbs_bench.rs‎
Lines changed: 8 additions & 0 deletions b/‎tfhe-benchmark/benches/core_crypto/ks_pbs_bench.rs‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎tfhe-benchmark/benches/core_crypto/modulus_switch_noise_reduction.rs‎
Lines changed: 1 addition & 0 deletions b/‎tfhe-benchmark/benches/core_crypto/modulus_switch_noise_reduction.rs‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎tfhe-benchmark/benches/core_crypto/pbs128_bench.rs‎
Lines changed: 4 additions & 0 deletions b/‎tfhe-benchmark/benches/core_crypto/pbs128_bench.rs‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎tfhe-benchmark/benches/core_crypto/pbs_bench.rs‎
Lines changed: 12 additions & 0 deletions b/‎tfhe-benchmark/benches/core_crypto/pbs_bench.rs‎
Lines changed: 12 additions & 0 deletions
@@ -51,30 +51,37 @@ fn benches(c: &mut Criterion, params: BooleanParameters, parameter_name: &str) {
     let ct3 = cks.encrypt(true);
 
     let id = format!("AND::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.and(&ct1, &ct2))));
     write_to_json_boolean(&id, params, parameter_name, "and");
 
     let id = format!("NAND::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.nand(&ct1, &ct2))));
     write_to_json_boolean(&id, params, parameter_name, "nand");
 
     let id = format!("OR::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.or(&ct1, &ct2))));
     write_to_json_boolean(&id, params, parameter_name, "or");
 
     let id = format!("XOR::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.xor(&ct1, &ct2))));
     write_to_json_boolean(&id, params, parameter_name, "xor");
 
     let id = format!("XNOR::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.xnor(&ct1, &ct2))));
     write_to_json_boolean(&id, params, parameter_name, "xnor");
 
     let id = format!("NOT::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.not(&ct1))));
     write_to_json_boolean(&id, params, parameter_name, "not");
 
     let id = format!("MUX::{parameter_name}");
+    println!("{id}");
     bench_group.bench_function(&id, |b| b.iter(|| black_box(sks.mux(&ct1, &ct2, &ct3))));
     write_to_json_boolean(&id, params, parameter_name, "mux");
 }
 
@@ -73,6 +73,7 @@ fn keyswitch<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
                 );
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
                 {
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
@@ -84,6 +85,7 @@ fn keyswitch<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1); // FIXME This number of elements does not saturate the target machine
                 bench_group.throughput(Throughput::Elements(elements));
@@ -231,6 +233,7 @@ fn packing_keyswitch<Scalar, F>(
                 );
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
                 {
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
@@ -242,6 +245,7 @@ fn packing_keyswitch<Scalar, F>(
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 bench_group.throughput(Throughput::Elements(elements));
@@ -414,6 +418,7 @@ mod cuda {
                     let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     {
                         bench_group.bench_function(&bench_id, |b| {
                             b.iter(|| {
@@ -435,6 +440,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
                     let blocks: usize = 1;
                     let elements = throughput_num_threads(blocks, 1);
                     let elements_per_stream = elements as usize / gpu_count;
@@ -644,6 +650,7 @@ mod cuda {
                     streams.synchronize();
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     {
                         bench_group.bench_function(&bench_id, |b| {
                             b.iter(|| {
@@ -663,6 +670,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
 
                     let mem_size = get_packing_keyswitch_list_64_size_on_gpu(
                         &CudaStreams::new_single_gpu(GpuIndex::new(0)),
 
@@ -111,6 +111,7 @@ fn ks_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
                 );
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
                 {
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
@@ -134,6 +135,7 @@ fn ks_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 println!("Number of elements: {elements}"); // DEBUG
@@ -370,6 +372,7 @@ fn multi_bit_ks_pbs<
                 );
 
                 bench_id = format!("{bench_name}::{name}::parallelized");
+                println!("{bench_id}");
                 bench_group.bench_function(&bench_id, |b| {
                     b.iter(|| {
                         keyswitch_lwe_ciphertext(
@@ -391,6 +394,7 @@ fn multi_bit_ks_pbs<
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 println!("Number of elements: {elements}"); // DEBUG
@@ -621,6 +625,7 @@ mod cuda {
                     let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     {
                         bench_group.bench_function(&bench_id, |b| {
                             b.iter(|| {
@@ -652,6 +657,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
                     let blocks: usize = 1;
                     let elements = throughput_num_threads(blocks, 1);
                     let elements_per_stream = elements as usize / gpu_count;
@@ -929,6 +935,7 @@ mod cuda {
                     let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
                             cuda_keyswitch_lwe_ciphertext(
@@ -958,6 +965,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
                     let blocks: usize = 1;
                     let elements = throughput_num_threads(blocks, 1);
                     let elements_per_stream = elements as usize / gpu_count;
 
@@ -62,6 +62,7 @@ fn modulus_switch_noise_reduction(c: &mut Criterion) {
             .measurement_time(std::time::Duration::from_secs(5));
 
         let bench_name = format!("modulus_switch_noise_reduction_{count}");
+        println!("{bench_name}");
 
         bench_group.bench_function(&bench_name, |b| {
             b.iter(|| {
 
@@ -296,6 +296,7 @@ mod cuda {
                     CudaLweCiphertextList::from_lwe_ciphertext(&out_pbs_ct, &streams);
 
                 bench_id = format!("{bench_name}::{params_name}");
+                println!("{bench_id}");
                 {
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
@@ -317,6 +318,7 @@ mod cuda {
                 let gpu_count = get_number_of_gpus() as usize;
 
                 bench_id = format!("{bench_name}::throughput::{params_name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 let elements_per_stream = elements as usize / gpu_count;
@@ -541,6 +543,7 @@ mod cuda {
                 let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                 bench_id = format!("{bench_name}::{params_name}");
+                println!("{bench_id}");
                 {
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
@@ -564,6 +567,7 @@ mod cuda {
                 let gpu_count = get_number_of_gpus() as usize;
 
                 bench_id = format!("{bench_name}::throughput::{params_name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 let elements_per_stream = elements as usize / gpu_count;
 
@@ -97,6 +97,7 @@ fn mem_optimized_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
                 );
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
 
                 bench_group.bench_function(&bench_id, |b| {
                     b.iter(|| {
@@ -114,6 +115,7 @@ fn mem_optimized_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize>(
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 bench_group.throughput(Throughput::Elements(elements));
@@ -326,6 +328,7 @@ fn mem_optimized_batched_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize
         );
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
                 bench_group.bench_function(&bench_id, |b| {
                     b.iter(|| {
                         batch_programmable_bootstrap_lwe_ciphertext_mem_optimized(
@@ -342,6 +345,7 @@ fn mem_optimized_batched_pbs<Scalar: UnsignedTorus + CastInto<usize> + Serialize
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 bench_group.throughput(Throughput::Elements(elements));
@@ -552,6 +556,7 @@ fn multi_bit_pbs<
                 );
 
                 bench_id = format!("{bench_name}::{name}::parallelized");
+                println!("{bench_id}");
                 bench_group.bench_function(&bench_id, |b| {
                     b.iter(|| {
                         multi_bit_programmable_bootstrap_lwe_ciphertext(
@@ -568,6 +573,7 @@ fn multi_bit_pbs<
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 bench_group.throughput(Throughput::Elements(elements));
@@ -779,6 +785,7 @@ fn mem_optimized_pbs_ntt(c: &mut Criterion) {
                 buffers.resize(stack_size);
 
                 bench_id = format!("{bench_name}::{name}");
+                println!("{bench_id}");
                 bench_group.bench_function(&bench_id, |b| {
                     b.iter(|| {
                         programmable_bootstrap_ntt64_lwe_ciphertext_mem_optimized(
@@ -795,6 +802,7 @@ fn mem_optimized_pbs_ntt(c: &mut Criterion) {
             }
             BenchmarkType::Throughput => {
                 bench_id = format!("{bench_name}::throughput::{name}");
+                println!("{bench_id}");
                 let blocks: usize = 1;
                 let elements = throughput_num_threads(blocks, 1);
                 bench_group.throughput(Throughput::Elements(elements));
@@ -1020,6 +1028,7 @@ mod cuda {
                     let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     {
                         bench_group.bench_function(&bench_id, |b| {
                             b.iter(|| {
@@ -1043,6 +1052,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
                     let blocks: usize = 1;
                     let elements = throughput_num_threads(blocks, 1);
                     let elements_per_stream = elements as usize / gpu_count;
@@ -1280,6 +1290,7 @@ mod cuda {
                     let cuda_indexes = CudaIndexes::new(&h_indexes, &streams, 0);
 
                     bench_id = format!("{bench_name}::{name}");
+                    println!("{bench_id}");
                     bench_group.bench_function(&bench_id, |b| {
                         b.iter(|| {
                             cuda_multi_bit_programmable_bootstrap_lwe_ciphertext(
@@ -1301,6 +1312,7 @@ mod cuda {
                     let gpu_count = get_number_of_gpus() as usize;
 
                     bench_id = format!("{bench_name}::throughput::{name}");
+                    println!("{bench_id}");
                     let blocks: usize = 1;
                     let elements = throughput_num_threads(blocks, 1);
                     let elements_per_stream = elements as usize / gpu_count;