zama-ai
diff --git a/‎tfhe/src/high_level_api/integers/signed/ops.rs
Lines changed: 91 additions & 1 deletion b/‎tfhe/src/high_level_api/integers/signed/ops.rs
Lines changed: 91 additions & 1 deletion
diff --git a/‎tfhe/src/high_level_api/integers/signed/scalar_ops.rs
Lines changed: 98 additions & 1 deletion b/‎tfhe/src/high_level_api/integers/signed/scalar_ops.rs
Lines changed: 98 additions & 1 deletion
diff --git a/‎tfhe/src/high_level_api/integers/signed/tests/gpu.rs
Lines changed: 57 additions & 2 deletions b/‎tfhe/src/high_level_api/integers/signed/tests/gpu.rs
Lines changed: 57 additions & 2 deletions
@@ -6,7 +6,8 @@ use crate::high_level_api::keys::InternalServerKey;
 #[cfg(feature = "gpu")]
 use crate::high_level_api::traits::{
     AddSizeOnGpu, BitAndSizeOnGpu, BitNotSizeOnGpu, BitOrSizeOnGpu, BitXorSizeOnGpu,
-    FheMaxSizeOnGpu, FheMinSizeOnGpu, FheOrdSizeOnGpu, SizeOnGpu, SubSizeOnGpu,
+    FheMaxSizeOnGpu, FheMinSizeOnGpu, FheOrdSizeOnGpu, RotateLeftSizeOnGpu, RotateRightSizeOnGpu,
+    ShlSizeOnGpu, ShrSizeOnGpu, SizeOnGpu, SubSizeOnGpu,
 };
 use crate::high_level_api::traits::{
     DivRem, FheEq, FheMax, FheMin, FheOrd, RotateLeft, RotateLeftAssign, RotateRight,
@@ -2363,3 +2364,92 @@ where
         })
     }
 }
+
+/// GPU size query for a left shift of a signed `FheInt` by an encrypted `FheUint` amount.
+///
+/// Forwards to the CUDA server key's `get_left_shift_size_on_gpu`; yields `0` when the
+/// currently set server key is not a CUDA key.
+#[cfg(feature = "gpu")]
+impl<Id, Id2> ShlSizeOnGpu<&FheUint<Id2>> for FheInt<Id>
+where
+    Id: FheIntId,
+    Id2: FheUintId,
+{
+    fn get_left_shift_size_on_gpu(&self, rhs: &FheUint<Id2>) -> u64 {
+        global_state::with_internal_keys(|key| match key {
+            InternalServerKey::Cuda(cuda_key) => with_thread_local_cuda_streams(|streams| {
+                // GPU-side views of both operands, obtained on the thread-local streams.
+                let lhs_on_gpu = self.ciphertext.on_gpu(streams);
+                let rhs_on_gpu = rhs.ciphertext.on_gpu(streams);
+                cuda_key
+                    .key
+                    .key
+                    .get_left_shift_size_on_gpu(&*lhs_on_gpu, &rhs_on_gpu, streams)
+            }),
+            // Non-CUDA server key: report 0.
+            _ => 0,
+        })
+    }
+}
+/// GPU size query for a right shift of a signed `FheInt` by an encrypted `FheUint` amount.
+///
+/// Forwards to the CUDA server key's `get_right_shift_size_on_gpu`; yields `0` when the
+/// currently set server key is not a CUDA key.
+#[cfg(feature = "gpu")]
+impl<Id, Id2> ShrSizeOnGpu<&FheUint<Id2>> for FheInt<Id>
+where
+    Id: FheIntId,
+    Id2: FheUintId,
+{
+    fn get_right_shift_size_on_gpu(&self, rhs: &FheUint<Id2>) -> u64 {
+        global_state::with_internal_keys(|key| match key {
+            InternalServerKey::Cuda(cuda_key) => with_thread_local_cuda_streams(|streams| {
+                // GPU-side views of both operands, obtained on the thread-local streams.
+                let lhs_on_gpu = self.ciphertext.on_gpu(streams);
+                let rhs_on_gpu = rhs.ciphertext.on_gpu(streams);
+                cuda_key
+                    .key
+                    .key
+                    .get_right_shift_size_on_gpu(&*lhs_on_gpu, &rhs_on_gpu, streams)
+            }),
+            // Non-CUDA server key: report 0.
+            _ => 0,
+        })
+    }
+}
+/// GPU size query for a left rotation of a signed `FheInt` by an encrypted `FheUint` amount.
+///
+/// Forwards to the CUDA server key's `get_rotate_left_size_on_gpu`; yields `0` when the
+/// currently set server key is not a CUDA key.
+#[cfg(feature = "gpu")]
+impl<Id, Id2> RotateLeftSizeOnGpu<&FheUint<Id2>> for FheInt<Id>
+where
+    Id: FheIntId,
+    Id2: FheUintId,
+{
+    fn get_rotate_left_size_on_gpu(&self, rhs: &FheUint<Id2>) -> u64 {
+        global_state::with_internal_keys(|key| match key {
+            InternalServerKey::Cuda(cuda_key) => with_thread_local_cuda_streams(|streams| {
+                // GPU-side views of both operands, obtained on the thread-local streams.
+                let lhs_on_gpu = self.ciphertext.on_gpu(streams);
+                let rhs_on_gpu = rhs.ciphertext.on_gpu(streams);
+                cuda_key
+                    .key
+                    .key
+                    .get_rotate_left_size_on_gpu(&*lhs_on_gpu, &rhs_on_gpu, streams)
+            }),
+            // Non-CUDA server key: report 0.
+            _ => 0,
+        })
+    }
+}
+/// GPU size query for a right rotation of a signed `FheInt` by an encrypted `FheUint` amount.
+///
+/// Forwards to the CUDA server key's `get_rotate_right_size_on_gpu`; yields `0` when the
+/// currently set server key is not a CUDA key.
+#[cfg(feature = "gpu")]
+impl<Id, Id2> RotateRightSizeOnGpu<&FheUint<Id2>> for FheInt<Id>
+where
+    Id: FheIntId,
+    Id2: FheUintId,
+{
+    fn get_rotate_right_size_on_gpu(&self, rhs: &FheUint<Id2>) -> u64 {
+        global_state::with_internal_keys(|key| match key {
+            InternalServerKey::Cuda(cuda_key) => with_thread_local_cuda_streams(|streams| {
+                // GPU-side views of both operands, obtained on the thread-local streams.
+                let lhs_on_gpu = self.ciphertext.on_gpu(streams);
+                let rhs_on_gpu = rhs.ciphertext.on_gpu(streams);
+                cuda_key
+                    .key
+                    .key
+                    .get_rotate_right_size_on_gpu(&*lhs_on_gpu, &rhs_on_gpu, streams)
+            }),
+            // Non-CUDA server key: report 0.
+            _ => 0,
+        })
+    }
+}
@@ -10,7 +10,8 @@ use crate::high_level_api::keys::InternalServerKey;
 #[cfg(feature = "gpu")]
 use crate::high_level_api::traits::{
     AddSizeOnGpu, BitAndSizeOnGpu, BitOrSizeOnGpu, BitXorSizeOnGpu, FheMaxSizeOnGpu,
-    FheMinSizeOnGpu, FheOrdSizeOnGpu, SubSizeOnGpu,
+    FheMinSizeOnGpu, FheOrdSizeOnGpu, RotateLeftSizeOnGpu, RotateRightSizeOnGpu, ShlSizeOnGpu,
+    ShrSizeOnGpu, SubSizeOnGpu,
 };
 use crate::high_level_api::traits::{
     DivRem, FheEq, FheMax, FheMin, FheOrd, RotateLeft, RotateLeftAssign, RotateRight,
@@ -628,6 +629,30 @@ macro_rules! define_scalar_rotate_shifts {
                 )*
         );
 
+        // GPU-only: generates `ShlSizeOnGpu::get_left_shift_size_on_gpu` for every
+        // (encrypted type, scalar type) pair handed to this macro, backed by the CUDA
+        // server key's `get_scalar_left_shift_size_on_gpu`.
+        #[cfg(feature = "gpu")]
+        generic_integer_impl_get_scalar_operation_size_on_gpu!(
+            rust_trait: ShlSizeOnGpu(get_left_shift_size_on_gpu),
+            implem: {
+                // The clear shift amount (`_rhs`) is unused: only the encrypted
+                // left-hand side is passed to the size query.
+                |lhs: &FheInt<_>, _rhs| {
+                    global_state::with_internal_keys(|key|
+                    if let InternalServerKey::Cuda(cuda_key) = key {
+                        with_thread_local_cuda_streams(|streams| {
+                            cuda_key.key.key.get_scalar_left_shift_size_on_gpu(
+                                &*lhs.ciphertext.on_gpu(streams),
+                                streams,
+                            )
+                        })
+                    } else {
+                        // Non-CUDA server key: report 0.
+                        0
+                    })
+                }
+            },
+            fhe_and_scalar_type:
+                $(
+                    ($concrete_type, $($scalar_type,)*),
+                )*
+        );
+
         generic_integer_impl_scalar_operation!(
             rust_trait: Shr(shr),
             implem: {
@@ -661,6 +686,30 @@ macro_rules! define_scalar_rotate_shifts {
                 )*
         );
 
+        // GPU-only: generates `ShrSizeOnGpu::get_right_shift_size_on_gpu` for every
+        // (encrypted type, scalar type) pair handed to this macro, backed by the CUDA
+        // server key's `get_scalar_right_shift_size_on_gpu`.
+        #[cfg(feature = "gpu")]
+        generic_integer_impl_get_scalar_operation_size_on_gpu!(
+            rust_trait: ShrSizeOnGpu(get_right_shift_size_on_gpu),
+            implem: {
+                // The clear shift amount (`_rhs`) is unused: only the encrypted
+                // left-hand side is passed to the size query.
+                |lhs: &FheInt<_>, _rhs| {
+                    global_state::with_internal_keys(|key|
+                    if let InternalServerKey::Cuda(cuda_key) = key {
+                        with_thread_local_cuda_streams(|streams| {
+                            cuda_key.key.key.get_scalar_right_shift_size_on_gpu(
+                                &*lhs.ciphertext.on_gpu(streams),
+                                streams,
+                            )
+                        })
+                    } else {
+                        // Non-CUDA server key: report 0.
+                        0
+                    })
+                }
+            },
+            fhe_and_scalar_type:
+                $(
+                    ($concrete_type, $($scalar_type,)*),
+                )*
+        );
+
         generic_integer_impl_scalar_operation!(
             rust_trait: RotateLeft(rotate_left),
             implem: {
@@ -694,6 +743,30 @@ macro_rules! define_scalar_rotate_shifts {
                 )*
         );
 
+        // GPU-only: generates `RotateLeftSizeOnGpu::get_rotate_left_size_on_gpu` for every
+        // (encrypted type, scalar type) pair handed to this macro, backed by the CUDA
+        // server key's `get_scalar_rotate_left_size_on_gpu`.
+        #[cfg(feature = "gpu")]
+        generic_integer_impl_get_scalar_operation_size_on_gpu!(
+            rust_trait: RotateLeftSizeOnGpu(get_rotate_left_size_on_gpu),
+            implem: {
+                // The clear rotation amount (`_rhs`) is unused: only the encrypted
+                // left-hand side is passed to the size query.
+                |lhs: &FheInt<_>, _rhs| {
+                    global_state::with_internal_keys(|key|
+                    if let InternalServerKey::Cuda(cuda_key) = key {
+                        with_thread_local_cuda_streams(|streams| {
+                            cuda_key.key.key.get_scalar_rotate_left_size_on_gpu(
+                                &*lhs.ciphertext.on_gpu(streams),
+                                streams,
+                            )
+                        })
+                    } else {
+                        // Non-CUDA server key: report 0.
+                        0
+                    })
+                }
+            },
+            fhe_and_scalar_type:
+                $(
+                    ($concrete_type, $($scalar_type,)*),
+                )*
+        );
+
         generic_integer_impl_scalar_operation!(
             rust_trait: RotateRight(rotate_right),
             implem: {
@@ -727,6 +800,30 @@ macro_rules! define_scalar_rotate_shifts {
                 )*
         );
 
+        // GPU-only: generates `RotateRightSizeOnGpu::get_rotate_right_size_on_gpu` for every
+        // (encrypted type, scalar type) pair handed to this macro, backed by the CUDA
+        // server key's `get_scalar_rotate_right_size_on_gpu`.
+        #[cfg(feature = "gpu")]
+        generic_integer_impl_get_scalar_operation_size_on_gpu!(
+            rust_trait: RotateRightSizeOnGpu(get_rotate_right_size_on_gpu),
+            implem: {
+                // The clear rotation amount (`_rhs`) is unused: only the encrypted
+                // left-hand side is passed to the size query.
+                |lhs: &FheInt<_>, _rhs| {
+                    global_state::with_internal_keys(|key|
+                    if let InternalServerKey::Cuda(cuda_key) = key {
+                        with_thread_local_cuda_streams(|streams| {
+                            cuda_key.key.key.get_scalar_rotate_right_size_on_gpu(
+                                &*lhs.ciphertext.on_gpu(streams),
+                                streams,
+                            )
+                        })
+                    } else {
+                        // Non-CUDA server key: report 0.
+                        0
+                    })
+                }
+            },
+            fhe_and_scalar_type:
+                $(
+                    ($concrete_type, $($scalar_type,)*),
+                )*
+        );
+
         generic_integer_impl_scalar_operation_assign!(
             rust_trait: ShlAssign(shl_assign),
             implem: {
 
@@ -5,10 +5,10 @@ use crate::high_level_api::integers::unsigned::tests::gpu::setup_gpu;
 use crate::prelude::{
     check_valid_cuda_malloc, AddSizeOnGpu, BitAndSizeOnGpu, BitNotSizeOnGpu, BitOrSizeOnGpu,
     BitXorSizeOnGpu, FheMaxSizeOnGpu, FheMinSizeOnGpu, FheOrdSizeOnGpu, FheTryEncrypt,
-    SubSizeOnGpu,
+    RotateLeftSizeOnGpu, RotateRightSizeOnGpu, ShlSizeOnGpu, ShrSizeOnGpu, SubSizeOnGpu,
 };
 use crate::shortint::parameters::PARAM_GPU_MULTI_BIT_GROUP_4_MESSAGE_2_CARRY_2_KS_PBS;
-use crate::{FheInt32, GpuIndex};
+use crate::{FheInt32, FheUint32, GpuIndex};
 use rand::Rng;
 
 #[test]
@@ -236,3 +236,58 @@ fn test_gpu_get_comparisons_size_on_gpu() {
         GpuIndex::new(0)
     ));
 }
+
+/// Checks that each shift/rotate size query on a signed GPU ciphertext, with both an
+/// encrypted and a clear right-hand side, passes `check_valid_cuda_malloc` on GPU index 0.
+#[test]
+fn test_gpu_get_shift_rotate_size_on_gpu() {
+    let cks = setup_gpu(Some(PARAM_GPU_MULTI_BIT_GROUP_4_MESSAGE_2_CARRY_2_KS_PBS));
+    let mut rng = rand::thread_rng();
+    let clear_a = rng.gen_range(1..=i32::MAX);
+    let clear_b = rng.gen_range(1..=u32::MAX);
+
+    let mut a = FheInt32::try_encrypt(clear_a, &cks).unwrap();
+    let mut b = FheUint32::try_encrypt(clear_b, &cks).unwrap();
+    a.move_to_current_device();
+    b.move_to_current_device();
+    let (a, b) = (&a, &b);
+
+    // Shared check applied to every reported size.
+    let assert_fits_on_gpu =
+        |size: u64| assert!(check_valid_cuda_malloc(size, GpuIndex::new(0)));
+
+    // Left shift: encrypted amount, then clear amount.
+    let encrypted_rhs_size = a.get_left_shift_size_on_gpu(b);
+    let clear_rhs_size = a.get_left_shift_size_on_gpu(clear_b);
+    assert_fits_on_gpu(encrypted_rhs_size);
+    assert_fits_on_gpu(clear_rhs_size);
+
+    // Right shift.
+    let encrypted_rhs_size = a.get_right_shift_size_on_gpu(b);
+    let clear_rhs_size = a.get_right_shift_size_on_gpu(clear_b);
+    assert_fits_on_gpu(encrypted_rhs_size);
+    assert_fits_on_gpu(clear_rhs_size);
+
+    // Left rotation.
+    let encrypted_rhs_size = a.get_rotate_left_size_on_gpu(b);
+    let clear_rhs_size = a.get_rotate_left_size_on_gpu(clear_b);
+    assert_fits_on_gpu(encrypted_rhs_size);
+    assert_fits_on_gpu(clear_rhs_size);
+
+    // Right rotation.
+    let encrypted_rhs_size = a.get_rotate_right_size_on_gpu(b);
+    let clear_rhs_size = a.get_rotate_right_size_on_gpu(clear_b);
+    assert_fits_on_gpu(encrypted_rhs_size);
+    assert_fits_on_gpu(clear_rhs_size);
+}