
Commit 99cd201

Merge pull request #4870 from xxuejie/revisit-scheduler-public-apis
refactor: Revisit Scheduler's public API
2 parents f2cc79f + ded45d8 · commit 99cd201

File tree: 3 files changed, +235 −68 lines changed


script/src/scheduler.rs

Lines changed: 190 additions & 58 deletions
```diff
@@ -5,8 +5,9 @@ use crate::syscalls::{
 };
 
 use crate::types::{
-    DataLocation, DataPieceId, FIRST_FD_SLOT, FIRST_VM_ID, Fd, FdArgs, FullSuspendedState, Message,
-    ReadState, RunMode, SgData, SyscallGenerator, VmArgs, VmContext, VmId, VmState, WriteState,
+    DataLocation, DataPieceId, FIRST_FD_SLOT, FIRST_VM_ID, Fd, FdArgs, FullSuspendedState,
+    IterationResult, Message, ReadState, RunMode, SgData, SyscallGenerator, TerminatedResult,
+    VmArgs, VmContext, VmId, VmState, WriteState,
 };
 use ckb_traits::{CellDataProvider, ExtensionProvider, HeaderProvider};
 use ckb_types::core::Cycle;
@@ -48,12 +49,12 @@ where
     M: DefaultMachineRunner,
 {
     /// Immutable context data for current running transaction & script.
-    pub sg_data: SgData<DL>,
+    sg_data: SgData<DL>,
 
     /// Syscall generator
-    pub syscall_generator: SyscallGenerator<DL, V, M::Inner>,
+    syscall_generator: SyscallGenerator<DL, V, M::Inner>,
     /// Syscall generator context
-    pub syscall_context: V,
+    syscall_context: V,
 
     /// Total cycles. When a scheduler executes, there are 3 variables
     /// that might all contain charged cycles: +total_cycles+,
```

```diff
@@ -83,29 +84,37 @@ where
     ///
     /// One can consider that +total_cycles+ contains the total cycles
     /// consumed in current scheduler, when the scheduler is not busy executing.
-    pub total_cycles: Arc<AtomicU64>,
+    ///
+    /// NOTE: the above workflow describes the optimal case: `iteration_cycles`
+    /// will always be zero after each iteration. However, our initial implementation
+    /// for the Meepo hardfork contains a bug: cycles charged by suspending / resuming
+    /// VMs when processing IOs will not be reflected in the `current cycles` syscalls
+    /// of the subsequently running VMs. To preserve this behavior, consumed cycles in
+    /// `iteration_cycles` cannot be moved at iteration boundaries. Later hardfork
+    /// versions might fix this, but for the Meepo hardfork we have to preserve this
+    /// behavior.
+    total_cycles: Arc<AtomicU64>,
     /// Iteration cycles, see +total_cycles+ on its usage
-    pub iteration_cycles: Cycle,
+    iteration_cycles: Cycle,
     /// Next vm id used by spawn.
-    pub next_vm_id: VmId,
+    next_vm_id: VmId,
     /// Next fd used by pipe.
-    pub next_fd_slot: u64,
+    next_fd_slot: u64,
     /// Used to store VM state.
-    pub states: BTreeMap<VmId, VmState>,
+    states: BTreeMap<VmId, VmState>,
     /// Used to confirm the owner of fd.
-    pub fds: BTreeMap<Fd, VmId>,
+    fds: BTreeMap<Fd, VmId>,
     /// Verify the VM's inherited fd list.
-    pub inherited_fd: BTreeMap<VmId, Vec<Fd>>,
+    inherited_fd: BTreeMap<VmId, Vec<Fd>>,
     /// Instantiated vms.
-    pub instantiated: BTreeMap<VmId, (VmContext<DL>, M)>,
+    instantiated: BTreeMap<VmId, (VmContext<DL>, M)>,
     /// Suspended vms.
-    pub suspended: BTreeMap<VmId, Snapshot2<DataPieceId>>,
+    suspended: BTreeMap<VmId, Snapshot2<DataPieceId>>,
     /// Terminated vms.
-    pub terminated_vms: BTreeMap<VmId, i8>,
+    terminated_vms: BTreeMap<VmId, i8>,
 
     /// MessageBox is expected to be empty before returning from `run`
     /// function, there is no need to persist messages.
-    pub message_box: Arc<Mutex<Vec<Message>>>,
+    message_box: Arc<Mutex<Vec<Message>>>,
 }
 
 impl<DL, V, M> Scheduler<DL, V, M>
```

```diff
@@ -143,8 +152,40 @@ where
         self.total_cycles.load(Ordering::Acquire)
     }
 
+    /// Fetch the state of the specified VM
+    pub fn state(&self, vm_id: &VmId) -> Option<VmState> {
+        self.states.get(vm_id).cloned()
+    }
+
+    /// Access the SgData data structure
+    pub fn sg_data(&self) -> &SgData<DL> {
+        &self.sg_data
+    }
+
+    /// This function provides a peek into one of the currently created
+    /// VMs. Depending on its actual state, the VM might be either instantiated
+    /// or suspended, so 2 callback functions must be provided to handle both
+    /// cases. The function only provides a *peek*, meaning the caller must not
+    /// make any changes to an instantiated VM. The VM is passed as a mutable
+    /// reference only because memory load functions in CKB-VM require mutable
+    /// references; it does not mean the caller can modify the VM in any sense.
+    /// Even a slight tampering of the VM can result in non-determinism.
+    pub fn peek<F, G, W>(&mut self, vm_id: &VmId, mut f: F, mut g: G) -> Result<W, Error>
+    where
+        F: FnMut(&mut M) -> Result<W, Error>,
+        G: FnMut(&Snapshot2<DataPieceId>, &SgData<DL>) -> Result<W, Error>,
+    {
+        if let Some((_, machine)) = self.instantiated.get_mut(vm_id) {
+            return f(machine);
+        }
+        if let Some(snapshot) = self.suspended.get(vm_id) {
+            return g(snapshot, &self.sg_data);
+        }
+        Err(Error::Unexpected(format!("VM {} does not exist!", vm_id)))
+    }
+
     /// Add cycles to total cycles.
-    pub fn consume_cycles(&mut self, cycles: Cycle) -> Result<(), Error> {
+    fn consume_cycles(&mut self, cycles: Cycle) -> Result<(), Error> {
         match self
             .total_cycles
             .fetch_update(Ordering::AcqRel, Ordering::Acquire, |total_cycles| {
```

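With all of `Scheduler`'s fields now private, read-only inspection goes through the new accessors, most notably `peek`. The snippet below is a usage sketch, not part of this commit: the `scheduler` and `vm_id` bindings are assumed to exist in the caller's scope, and `cycles()` is the standard `SupportMachine` accessor from ckb-vm.

```rust
// Hypothetical usage sketch: read the cycle counter of a VM through `peek`.
// For a suspended VM we simply report `None` rather than poking into the
// snapshot's internals.
let vm_cycles: Option<u64> = scheduler.peek(
    &vm_id,
    // Instantiated case: the &mut is only demanded by CKB-VM's memory API;
    // the machine must not actually be modified.
    |machine| Ok(Some(machine.machine().cycles())),
    // Suspended case: we get the Snapshot2 plus the read-only SgData.
    |_snapshot, _sg_data| Ok(None),
)?;
```
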
```diff
@@ -167,7 +208,7 @@ where
             syscall_generator,
             syscall_context,
             total_cycles: Arc::new(AtomicU64::new(full.total_cycles)),
-            iteration_cycles: 0,
+            iteration_cycles: full.iteration_cycles,
             next_vm_id: full.next_vm_id,
             next_fd_slot: full.next_fd_slot,
             states: full
```

```diff
@@ -217,6 +258,7 @@ where
             // consensus. We are not charging cycles for suspending
             // a VM in the process of suspending the whole scheduler.
             total_cycles: self.total_cycles.load(Ordering::Acquire),
+            iteration_cycles: self.iteration_cycles,
             next_vm_id: self.next_vm_id,
             next_fd_slot: self.next_fd_slot,
             vms,
```

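These two hunks persist `iteration_cycles` across suspend/resume, so the mid-iteration cycle debt described in the NOTE above survives a round trip. A rough sketch of the resulting bookkeeping, assuming a `FullSuspendedState` value `full` is reachable from the caller with the fields shown in this diff:

```rust
// Hypothetical sketch: after this commit a suspended state carries both
// counters, and the resumed scheduler will fold the in-flight portion into
// the total once the next iteration settles.
let settled: Cycle = full.total_cycles; // cycles from finished iterations
let in_flight: Cycle = full.iteration_cycles; // cycles of the interrupted iteration
let expected_consumed = settled
    .checked_add(in_flight)
    .expect("cycle overflow (sketch only)");
```
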
```diff
@@ -240,50 +282,51 @@ where
     /// * Cycle limit reached, the returned error would be ckb_vm::Error::CyclesExceeded,
     /// * Pause trigger, the returned error would be ckb_vm::Error::Pause,
     /// * Other terminating errors
-    pub fn run(&mut self, mode: RunMode) -> Result<(i8, Cycle), Error> {
-        if self.states.is_empty() {
-            // Booting phase, we will need to initialize the first VM.
-            let program_id = self.sg_data.sg_info.program_data_piece_id.clone();
-            assert_eq!(
-                self.boot_vm(
-                    &DataLocation {
-                        data_piece_id: program_id,
-                        offset: 0,
-                        length: u64::MAX,
-                    },
-                    VmArgs::Vector(vec![]),
-                )?,
-                ROOT_VM_ID
-            );
-        }
-        assert!(self.states.contains_key(&ROOT_VM_ID));
+    pub fn run(&mut self, mode: RunMode) -> Result<TerminatedResult, Error> {
+        self.boot_root_vm_if_needed()?;
 
         let (pause, mut limit_cycles) = match mode {
             RunMode::LimitCycles(limit_cycles) => (Pause::new(), limit_cycles),
             RunMode::Pause(pause) => (pause, u64::MAX),
         };
 
-        while self.states[&ROOT_VM_ID] != VmState::Terminated {
-            assert_eq!(self.iteration_cycles, 0);
-            let iterate_return = self.iterate(pause.clone(), limit_cycles);
-            self.consume_cycles(self.iteration_cycles)?;
-            limit_cycles = limit_cycles
-                .checked_sub(self.iteration_cycles)
-                .ok_or(Error::CyclesExceeded)?;
-            // Clear iteration cycles intentionally after each run
-            self.iteration_cycles = 0;
-            iterate_return?;
+        while !self.terminated() {
+            limit_cycles = self.iterate_outer(&pause, limit_cycles)?.1;
         }
+        assert_eq!(self.iteration_cycles, 0);
 
-        // At this point, root VM cannot be suspended
-        let root_vm = &self.instantiated[&ROOT_VM_ID];
-        Ok((root_vm.1.machine().exit_code(), self.consumed_cycles()))
+        self.terminated_result()
+    }
+
+    /// Public API that runs a single VM, processes all messages, then returns
+    /// the executed VM ID (so the caller can fetch data afterwards). This can
+    /// be used when finer-grained control over a single VM is required.
+    pub fn iterate(&mut self) -> Result<IterationResult, Error> {
+        self.boot_root_vm_if_needed()?;
+
+        if self.terminated() {
+            return Ok(IterationResult {
+                executed_vm: ROOT_VM_ID,
+                terminated_status: Some(self.terminated_result()?),
+            });
+        }
+
+        let (id, _) = self.iterate_outer(&Pause::new(), u64::MAX)?;
+        let terminated_status = if self.terminated() {
+            assert_eq!(self.iteration_cycles, 0);
+            Some(self.terminated_result()?)
+        } else {
+            None
+        };
+
+        Ok(IterationResult {
+            executed_vm: id,
+            terminated_status,
+        })
     }
 
     /// Returns the machine that needs to be executed in the current iterate.
-    pub fn iterate_prepare_machine(&mut self) -> Result<(u64, &mut M), Error> {
-        // Process all pending VM reads & writes.
-        self.process_io()?;
+    fn iterate_prepare_machine(&mut self) -> Result<(u64, &mut M), Error> {
         // Find a runnable VM that has the largest ID.
         let vm_id_to_run = self
             .states
```

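The batch entry point keeps its shape, but now returns a structured `TerminatedResult` instead of a bare `(i8, Cycle)` tuple. A minimal usage sketch, assuming a fully constructed `scheduler` and a `max_cycles` budget (both placeholders; construction is elided):

```rust
use ckb_vm::machine::Pause;

// Run to completion under a cycle budget.
let result: TerminatedResult = scheduler.run(RunMode::LimitCycles(max_cycles))?;
println!(
    "exit code: {}, consumed cycles: {}",
    result.exit_code, result.consumed_cycles
);

// Alternatively, run until an external pause signal fires; another thread
// would hold a clone of `pause` and interrupt it.
let pause = Pause::new();
let result = scheduler.run(RunMode::Pause(pause.clone()))?;
```
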
```diff
@@ -300,7 +343,7 @@ where
     }
 
     /// Process machine execution results in the current iterate.
-    pub fn iterate_process_results(
+    fn iterate_process_results(
         &mut self,
         vm_id_to_run: u64,
         result: Result<i8, Error>,
```

```diff
@@ -309,7 +352,7 @@ where
         self.process_message_box()?;
         assert!(self.message_box.lock().expect("lock").is_empty());
         // If the VM terminates, update VMs in join state, also closes its fds
-        match result {
+        let result = match result {
             Ok(code) => {
                 self.terminated_vms.insert(vm_id_to_run, code);
                 // When root VM terminates, the execution stops immediately, we will purge
```

```diff
@@ -357,13 +400,59 @@ where
             }
             Err(Error::Yield) => Ok(()),
             Err(e) => Err(e),
-        }
+        };
+        result
+    }
+
+    // This internal function is actually a wrapper over +iterate_inner+;
+    // it is split into a separate function so that cycle calculation is
+    // performed no matter what result +iterate_inner+ returns.
+    #[inline]
+    fn iterate_outer(
+        &mut self,
+        pause: &Pause,
+        limit_cycles: Cycle,
+    ) -> Result<(VmId, Cycle), Error> {
+        let iterate_return = self.iterate_inner(pause.clone(), limit_cycles);
+        self.consume_cycles(self.iteration_cycles)?;
+        let remaining_cycles = limit_cycles
+            .checked_sub(self.iteration_cycles)
+            .ok_or(Error::CyclesExceeded)?;
+        // Clear iteration cycles intentionally after each run
+        self.iteration_cycles = 0;
+        // Process all pending VM reads & writes. Ideally, this invocation
+        // would be put at the end of the `iterate_inner` function. However, 2
+        // things prevent this:
+        //
+        // * In the earlier implementation of the Meepo hardfork version,
+        //   `self.process_io` was put at the very start of the
+        //   +iterate_prepare_machine+ method, meaning we used to process IO
+        //   syscalls at the very start of a new iteration.
+        // * The earlier implementation contains a bug: cycles consumed by
+        //   suspending / resuming VMs are not updated in the subsequent VM's
+        //   `current cycles` syscalls.
+        //
+        // To make the ckb-script package suitable for outside usage, we want
+        // IOs processed at the end of each iteration, not at the start of the
+        // next iteration. We also need to replicate the exact runtime behavior
+        // of the Meepo hardfork. This means the only viable change is:
+        //
+        // * Move the `self.process_io` call to the very end of the
+        //   `iterate_outer` method, which is exactly its current location.
+        // * For now, live with the fact that `iteration_cycles` will not
+        //   always be zero at iteration boundaries, and also preserve its
+        //   value in `FullSuspendedState`.
+        //
+        // One expected change is that +process_io+ is now called once more
+        // after the whole scheduler terminates, and is no longer called at the
+        // very beginning when no VM is executing. But since no VMs can be in
+        // IO states at these 2 time slots, we should be fine here.
+        self.process_io()?;
+        let id = iterate_return?;
+        Ok((id, remaining_cycles))
     }
 
     // This is an internal function that does the actual VM execution loop.
     // Here both the pause signal and limit_cycles are provided so as to
     // simplify branches.
-    fn iterate(&mut self, pause: Pause, limit_cycles: Cycle) -> Result<(), Error> {
+    fn iterate_inner(&mut self, pause: Pause, limit_cycles: Cycle) -> Result<VmId, Error> {
         // Execute the VM for real; consumed cycles in the virtual machine are
         // moved over to +iteration_cycles+, then we reset the virtual machine's
         // own cycle count to zero.
```

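`iterate_outer` is the per-iteration machinery that both `run` and the new public `iterate` drive. For callers that want this granularity, here is a hedged sketch of a driver loop over `iterate` (the `scheduler` binding and the logging are illustrative only):

```rust
// Drive the scheduler one iteration at a time; between iterations the
// caller can inspect state via `state()`, `sg_data()`, or `peek()`.
loop {
    let IterationResult {
        executed_vm,
        terminated_status,
    } = scheduler.iterate()?;

    // Hypothetical inspection point: trace which VM just ran.
    println!("executed VM: {}", executed_vm);

    if let Some(TerminatedResult {
        exit_code,
        consumed_cycles,
    }) = terminated_status
    {
        println!("exit {exit_code} after {consumed_cycles} cycles");
        break;
    }
}
```
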
```diff
@@ -380,7 +469,8 @@ where
             .iteration_cycles
             .checked_add(cycles)
             .ok_or(Error::CyclesExceeded)?;
-        self.iterate_process_results(id, result)
+        self.iterate_process_results(id, result)?;
+        Ok(id)
     }
 
     fn process_message_box(&mut self) -> Result<(), Error> {
```

```diff
@@ -774,6 +864,27 @@ where
         Ok(())
     }
 
+    /// Whether the current scheduler has terminated
+    pub fn terminated(&self) -> bool {
+        self.states
+            .get(&ROOT_VM_ID)
+            .map(|state| *state == VmState::Terminated)
+            .unwrap_or(false)
+    }
+
+    fn terminated_result(&mut self) -> Result<TerminatedResult, Error> {
+        assert!(self.terminated());
+
+        let exit_code = {
+            let root_vm = &self.ensure_get_instantiated(&ROOT_VM_ID)?.1;
+            root_vm.machine().exit_code()
+        };
+        Ok(TerminatedResult {
+            exit_code,
+            consumed_cycles: self.consumed_cycles(),
+        })
+    }
+
     // Ensure VMs are instantiated
     fn ensure_vms_instantiated(&mut self, ids: &[VmId]) -> Result<(), Error> {
         if ids.len() > MAX_INSTANTIATED_VMS {
```

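The `terminated` predicate pairs naturally with the new `state` accessor for read-only checks from outside the scheduler. A small sketch, assuming `ROOT_VM_ID` is reachable from the caller and `VmState` derives the usual comparison traits:

```rust
// Once the scheduler reports termination, the root VM's recorded state
// must be Terminated; `state()` hands back a clone, so this stays read-only.
if scheduler.terminated() {
    assert_eq!(scheduler.state(&ROOT_VM_ID), Some(VmState::Terminated));
}
```
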
```diff
@@ -815,7 +926,7 @@ where
         Ok(())
     }
 
-    // Ensure corresponding VM is instantiated and return a mutable reference to it
+    /// Ensure corresponding VM is instantiated and return a mutable reference to it
     fn ensure_get_instantiated(&mut self, id: &VmId) -> Result<&mut (VmContext<DL>, M), Error> {
         self.ensure_vms_instantiated(&[*id])?;
         self.instantiated
```

```diff
@@ -868,8 +979,29 @@ where
         Ok(())
     }
 
+    fn boot_root_vm_if_needed(&mut self) -> Result<(), Error> {
+        if self.states.is_empty() {
+            // Booting phase, we will need to initialize the first VM.
+            let program_id = self.sg_data.sg_info.program_data_piece_id.clone();
+            assert_eq!(
+                self.boot_vm(
+                    &DataLocation {
+                        data_piece_id: program_id,
+                        offset: 0,
+                        length: u64::MAX,
+                    },
+                    VmArgs::Vector(vec![]),
+                )?,
+                ROOT_VM_ID
+            );
+        }
+        assert!(self.states.contains_key(&ROOT_VM_ID));
+
+        Ok(())
+    }
+
     /// Boot a vm by given program and args.
-    pub fn boot_vm(&mut self, location: &DataLocation, args: VmArgs) -> Result<VmId, Error> {
+    fn boot_vm(&mut self, location: &DataLocation, args: VmArgs) -> Result<VmId, Error> {
         let id = self.next_vm_id;
         self.next_vm_id += 1;
         let (context, mut machine) = self.create_dummy_vm(&id)?;
```
