
Commit f677cb1

[rust/rqd] Refactor core reservation logic (#1769)
Use a single source of truth for core reservations. The previous logic spread reservation bookkeeping across multiple call sites, which created potential synchronization issues that could leak resources.
1 parent e2a057d commit f677cb1
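The refactor's central idea can be pictured as follows: instead of mirrored counters that every call site must update consistently, all reservation state lives behind one lock, keyed by the frame's resource id, so a release can never disagree with the reservation it undoes. A minimal sketch of that shape; `ReservationLedger` and its fields are hypothetical stand-ins, not the commit's actual types (the `uuid` crate, which the repo already uses, is assumed):

```rust
use std::collections::HashMap;
use std::sync::Mutex;
use uuid::Uuid;

// Hypothetical ledger: the only place reservation state is recorded.
struct ReservationLedger {
    inner: Mutex<LedgerState>,
}

struct LedgerState {
    idle_threads: Vec<u32>,                // thread ids currently free
    reservations: HashMap<Uuid, Vec<u32>>, // resource_id -> reserved thread ids
}

impl ReservationLedger {
    // Reserve `count` threads atomically under the single lock.
    fn reserve(&self, resource_id: Uuid, count: usize) -> Result<Vec<u32>, String> {
        let mut state = self.inner.lock().unwrap();
        if state.idle_threads.len() < count {
            return Err(format!(
                "Tried to reserve {} out of {} threads available",
                count,
                state.idle_threads.len()
            ));
        }
        let reserved: Vec<u32> = state.idle_threads.drain(..count).collect();
        state.reservations.insert(resource_id, reserved.clone());
        Ok(reserved)
    }

    // Release looks the reservation up by resource_id, so a caller can
    // never free a different amount than was actually booked.
    fn release(&self, resource_id: &Uuid) -> Result<(), String> {
        let mut state = self.inner.lock().unwrap();
        let threads = state
            .reservations
            .remove(resource_id)
            .ok_or_else(|| format!("No reservation found for {}", resource_id))?;
        state.idle_threads.extend(threads);
        Ok(())
    }
}
```

Under this shape, every failure branch in the manager diff below reduces to a single `release_cores(&resource_id)` call.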

File tree: 8 files changed (+1039, -1539 lines)


rust/crates/opencue-proto/src/lib.rs

Lines changed: 0 additions & 111 deletions

@@ -2,7 +2,6 @@ use core::fmt;
 
 use host::Host;
 use job::{Frame, Job};
-use report::CoreDetail;
 use rqd::RunFrame;
 use uuid::Uuid;
 
@@ -127,113 +126,3 @@ impl fmt::Display for Host {
         write!(f, "{}/({})", self.name, self.id)
     }
 }
-
-impl CoreDetail {
-    /// Update CoreDetail by reserving a number of cores
-    ///
-    /// # Arguments
-    ///
-    /// * `core_count_with_multiplier` - Number of cores to reserve multiplied by core_multiplier
-    ///
-    /// # Returns
-    ///
-    /// * `Ok(())` if cores were reserved successfully
-    /// * `Err(String)` if trying to reserve more cores than are available
-    pub fn register_reservation(
-        &mut self,
-        core_count_with_multiplier: usize,
-    ) -> Result<(), String> {
-        if self.idle_cores - (core_count_with_multiplier as i32) < 0 {
-            Err(format!(
-                "Tried to reserve {} out of {} cores available",
-                core_count_with_multiplier, self.idle_cores,
-            ))
-        } else {
-            self.idle_cores -= core_count_with_multiplier as i32;
-            self.booked_cores += core_count_with_multiplier as i32;
-            Ok(())
-        }
-    }
-
-    /// Update CoreDetail by releasing a number of previously reserved cores
-    ///
-    /// # Arguments
-    ///
-    /// * `core_count_with_multiplier` - The number of cores to release multiplied by core_multiplier
-    ///
-    /// # Returns
-    ///
-    /// * `Ok(())` if cores were released successfully
-    /// * `Err(String)` if trying to release more cores than are currently reserved
-    pub fn register_release(&mut self, core_count_with_multiplier: u32) -> Result<(), String> {
-        if self.booked_cores < core_count_with_multiplier as i32 {
-            Err(format!(
-                "Tried to release {} out of {} cores reserved",
-                core_count_with_multiplier, self.booked_cores,
-            ))
-        } else {
-            self.idle_cores += core_count_with_multiplier as i32;
-            self.booked_cores -= core_count_with_multiplier as i32;
-            Ok(())
-        }
-    }
-
-    /// Update CoreDetail by locking a specified number of cores. If the amount requested is
-    /// not available, the maximum available will be reserved.
-    ///
-    /// # Arguments
-    ///
-    /// * `count_with_multiplier` - Number of cores to lock multiplied by core_multiplier
-    ///
-    /// # Returns
-    ///
-    /// * `u32` - The actual number of cores that were locked (may be less than requested if not enough are available)
-    pub fn lock_cores(&mut self, count_with_multiplier: u32) -> u32 {
-        let amount_not_locked = self.total_cores - self.locked_cores;
-        let amount_to_lock = std::cmp::min(amount_not_locked, count_with_multiplier as i32);
-
-        if amount_to_lock > 0 {
-            self.locked_cores += amount_to_lock;
-            self.idle_cores -= std::cmp::min(amount_to_lock, self.idle_cores)
-        }
-
-        amount_to_lock as u32
-    }
-
-    /// Update CoreDetail by locking all available cores
-    ///
-    /// This will set idle_cores to 0 and locked_cores to total_cores
-    pub fn lock_all_cores(&mut self) {
-        self.idle_cores = 0;
-        self.locked_cores = self.total_cores;
-    }
-
-    /// Update CoreDetail by unlocking a specified number of cores that were previously locked.
-    ///
-    /// # Arguments
-    ///
-    /// * `count_with_multiplier` - Number of cores to unlock multiplied by core_multiplier
-    ///
-    /// # Returns
-    ///
-    /// * `u32` - The actual number of cores that were unlocked (may be less than requested if fewer cores are locked)
-    pub fn unlock_cores(&mut self, count_with_multiplier: u32) -> u32 {
-        let amount_to_unlock = std::cmp::min(count_with_multiplier as i32, self.locked_cores);
-
-        if amount_to_unlock > 0 {
-            self.locked_cores -= amount_to_unlock;
-            self.idle_cores += amount_to_unlock;
-        }
-        amount_to_unlock as u32
-    }
-
-    /// Update CoreDetail by unlocking all locked cores
-    ///
-    /// This will unlock all locked cores and add them to idle_cores
-    pub fn unlock_all_cores(&mut self) {
-        if self.locked_cores > 0 {
-            self.idle_cores += self.locked_cores;
-            self.locked_cores = 0;
-        }
-    }
-}
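The removed helpers kept `idle_cores` and `booked_cores` as independently adjusted counters and trusted every caller to pass matching amounts to `register_reservation` and `register_release`. A toy illustration of the leak that permits, with a plain struct standing in for the real `CoreDetail` proto type:

```rust
// Plain counters standing in for the removed CoreDetail fields.
struct Counters {
    idle_cores: i32,
    booked_cores: i32,
}

fn main() {
    let mut c = Counters { idle_cores: 800, booked_cores: 0 };

    // One call site reserves with one computed amount...
    let reserved = 150;
    c.idle_cores -= reserved;
    c.booked_cores += reserved;

    // ...and an independent call site releases a differently computed amount.
    let released = 100;
    c.idle_cores += released;
    c.booked_cores -= released;

    // 50 cores now stay booked forever with no owner to free them: a leak.
    assert_eq!(c.booked_cores, 50);
}
```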

rust/crates/rqd/src/frame/manager.rs

Lines changed: 47 additions & 23 deletions

@@ -1,4 +1,5 @@
 use chrono::{DateTime, Local};
+use itertools::Either;
 use miette::{Diagnostic, Result, miette};
 use opencue_proto::{
     host::HardwareState,
@@ -64,17 +65,14 @@ impl FrameManager {
 
         // **Attention**: If an error happens between here and spawning a frame, the resources
         // reserved need to be released.
-        //
-        // Cuebot unfortunatelly uses a hardcoded frame environment variable to signal if
-        // a frame is hyperthreaded. Rqd should only reserve cores if a frame is hyperthreaded.
-        let hyperthreaded = run_frame
-            .environment
-            .get("CUE_THREADABLE")
-            .is_some_and(|v| v == "1");
+
         let num_cores = (run_frame.num_cores as u32).div_ceil(self.config.machine.core_multiplier);
+
+        // Reserving cores will always yield a list of reserved thread_ids. If hyperthreading is off,
+        // the list should be ignored
         let thread_ids = self
             .machine
-            .reserve_cores(num_cores as usize, run_frame.resource_id(), hyperthreaded)
+            .reserve_cores(Either::Left(num_cores as usize), run_frame.resource_id())
             .await
             .map_err(|err| {
                 FrameManagerError::Aborted(format!(
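`reserve_cores` now takes an `itertools::Either`, folding the old count-based call and the old `reserve_cores_by_id` affinity call (see the recovery hunk below) into one entry point. A toy, synchronous version of that dispatch under assumed semantics; the real method is async, lives on the machine handle, and also records the reservation under `resource_id`:

```rust
use itertools::Either;

// Left(count): reserve any `count` idle threads.
// Right(ids): claim exactly these threads (affinity booking).
fn reserve(request: Either<usize, Vec<u32>>, idle: &mut Vec<u32>) -> Result<Vec<u32>, String> {
    match request {
        Either::Left(count) => {
            if idle.len() < count {
                return Err(format!("need {count}, only {} idle", idle.len()));
            }
            Ok(idle.drain(..count).collect())
        }
        Either::Right(ids) => {
            if ids.iter().all(|id| idle.contains(id)) {
                idle.retain(|id| !ids.contains(id));
                Ok(ids)
            } else {
                Err("requested thread not idle".to_string())
            }
        }
    }
}

fn main() {
    let mut idle = vec![0u32, 1, 2, 3, 4, 5];
    let by_count = reserve(Either::Left(2), &mut idle).unwrap();
    let by_affinity = reserve(Either::Right(vec![4, 5]), &mut idle).unwrap();
    println!("{by_count:?} {by_affinity:?} idle={idle:?}");
}
```

Unifying both paths behind one function means there is a single place where reservations get recorded, which is exactly the single-source-of-truth goal the commit message states.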
@@ -90,7 +88,13 @@
                 let reserved_res = self.machine.reserve_gpus(run_frame.num_gpus as u32).await;
                 if reserved_res.is_err() {
                     // Release cores reserved on the last step
-                    self.machine.release_cores(num_cores, &thread_ids).await;
+                    if let Err(err) = self.machine.release_cores(&run_frame.resource_id()).await {
+                        warn!(
+                            "Failed to release cores reserved for {} during gpu reservation failure. {}",
+                            &run_frame.resource_id(),
+                            err
+                        )
+                    };
                 }
                 Some(reserved_res.map_err(|err| {
                     FrameManagerError::Aborted(format!(
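Note the pattern this hunk establishes: once cores are reserved, every later failure path must release them, and a failed release is only logged. A common alternative for making such cleanup unskippable is a drop guard that runs unless explicitly disarmed; this generic sketch is not what the commit does (it releases explicitly at each error site), just the idiom for comparison:

```rust
// Minimal drop guard: runs its cleanup closure unless disarmed.
struct Cleanup<F: FnMut()> {
    on_drop: F,
    armed: bool,
}

impl<F: FnMut()> Drop for Cleanup<F> {
    fn drop(&mut self) {
        if self.armed {
            (self.on_drop)();
        }
    }
}

fn main() {
    let mut guard = Cleanup {
        on_drop: || eprintln!("releasing cores reserved for frame"),
        armed: true,
    };

    // ... reserve gpus, spawn the frame ...
    let spawn_ok = false; // pretend the spawn failed

    if spawn_ok {
        guard.armed = false; // success: the running frame now owns the cores
    }
    // guard drops here; the cleanup runs exactly when something failed
}
```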
@@ -101,20 +105,35 @@
             }
         };
 
+        // Cuebot unfortunately uses a hardcoded frame environment variable to signal if
+        // a frame is hyperthreaded. Rqd should only reserve cores if a frame is hyperthreaded.
+        let hyperthreaded = run_frame
+            .environment
+            .get("CUE_THREADABLE")
+            .is_some_and(|v| v == "1");
+        // Ignore the list of allocated threads if hyperthreading is off
+        let thread_ids = hyperthreaded.then_some(thread_ids);
+
+        let resource_id = run_frame.resource_id();
         let running_frame = Arc::new(RunningFrame::init(
             run_frame,
             uid,
             self.config.runner.clone(),
-            thread_ids.clone(),
+            thread_ids,
             gpu_list,
             self.machine.get_host_name().await,
         ));
 
         if self.config.runner.run_on_docker {
             self.spawn_docker_frame(running_frame, false);
         } else if self.spawn_running_frame(running_frame, false).is_err() {
-            // Release cores reserved on the last step
-            self.machine.release_cores(num_cores, &thread_ids).await;
+            // Release cores reserved if spawning the frame failed
+            if let Err(err) = self.machine.release_cores(&resource_id).await {
+                warn!(
+                    "Failed to release cores reserved for {} during spawn failure. {}",
+                    &resource_id, err
+                );
+            }
         }
 
         Ok(())
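The frame now always reserves through the same path and only afterwards decides whether to keep the returned thread list as affinity information, using `bool::then_some`. For reference, its semantics:

```rust
fn main() {
    let thread_ids = vec![4u32, 5, 6, 7];

    // true.then_some(v) -> Some(v); false.then_some(v) -> None (v is still moved).
    let pinned: Option<Vec<u32>> = true.then_some(thread_ids.clone());
    let unpinned: Option<Vec<u32>> = false.then_some(thread_ids);

    assert_eq!(pinned, Some(vec![4, 5, 6, 7]));
    assert_eq!(unpinned, None);
}
```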
@@ -161,33 +180,38 @@
             Ok(running_frame) => {
                 // Update reservations. If a thread_ids list exists, the frame was booked using affinity
                 if let Err(err) = match &running_frame.thread_ids {
-                    Some(thread_ids) => self
-                        .machine
-                        .reserve_cores_by_id(thread_ids, running_frame.request.resource_id())
-                        .await
-                        .map(Some),
+                    Some(thread_ids) => {
+                        self.machine
+                            .reserve_cores(
+                                Either::Right(thread_ids.clone()),
+                                running_frame.request.resource_id(),
+                            )
+                            .await
+                    }
                     None => {
                         let num_cores = (running_frame.request.num_cores as u32)
                             .div_ceil(self.config.machine.core_multiplier);
                         self.machine
                             .reserve_cores(
-                                num_cores as usize,
+                                Either::Left(num_cores as usize),
                                 running_frame.request.resource_id(),
-                                false,
                             )
                             .await
                     }
                 } {
                     errors.push(err.to_string());
                 }
 
-                let num_cores = (running_frame.request.num_cores as u32)
-                    .div_ceil(self.config.machine.core_multiplier);
-                let thread_ids = &running_frame.thread_ids.clone();
+                let resource_id = running_frame.request.resource_id();
                 if self.config.runner.run_on_docker {
                     todo!("Recovering frames when running on docker is not yet supported")
                 } else if self.spawn_running_frame(running_frame, true).is_err() {
-                    self.machine.release_cores(num_cores, thread_ids).await;
+                    if let Err(err) = self.machine.release_cores(&resource_id).await {
+                        warn!(
+                            "Failed to release cores reserved for {} during recover spawn error. {}",
+                            &resource_id, err
+                        );
+                    }
                 }
             }
             Err(err) => {
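Logging and continuing on a failed release is reasonable under the keyed scheme, because releasing an id with no entry reports nothing to free instead of corrupting shared counters. A toy demonstration, with a plain map standing in for the hypothetical ledger sketched earlier:

```rust
use std::collections::HashMap;

fn main() {
    // resource_id -> reserved thread ids (a plain map standing in for the ledger)
    let mut reservations: HashMap<&str, Vec<u32>> = HashMap::new();
    reservations.insert("frame-1", vec![2, 3]);

    // The first release finds the entry and frees exactly what was booked...
    assert_eq!(reservations.remove("frame-1"), Some(vec![2, 3]));

    // ...a second release finds nothing: an error to log, never a double-free.
    assert_eq!(reservations.remove("frame-1"), None);
}
```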
