Skip to content

Commit

Permalink
Implement FlattenedArgsReader
Browse files Browse the repository at this point in the history
  • Loading branch information
mohanson committed Jan 16, 2025
1 parent 68a5331 commit 10ec946
Show file tree
Hide file tree
Showing 18 changed files with 259 additions and 172 deletions.
10 changes: 8 additions & 2 deletions examples/check_real_memory.rs
Original file line number Diff line number Diff line change
Expand Up @@ -168,7 +168,10 @@ fn check_asm(memory_size: usize) -> Result<(), ()> {
let core = DefaultMachineBuilder::new(asm_core).build();
let mut machine = AsmMachine::new(core);
machine
.load_program(&Bytes::from(BIN_PATH_BUFFER), &vec![Bytes::from(BIN_NAME)])
.load_program(
&Bytes::from(BIN_PATH_BUFFER),
[Ok(Bytes::from(BIN_NAME))].into_iter(),
)
.unwrap();
let result = machine.run();
assert!(result.is_ok());
Expand All @@ -192,7 +195,10 @@ fn check_asm_in_thread(memory_size: usize) -> Result<(), ()> {
let core = DefaultMachineBuilder::new(asm_core).build();
let mut machine = AsmMachine::new(core);
machine
.load_program(&Bytes::from(BIN_PATH_BUFFER), &vec![Bytes::from(BIN_NAME)])
.load_program(
&Bytes::from(BIN_PATH_BUFFER),
[Ok(Bytes::from(BIN_NAME))].into_iter(),
)
.unwrap();
let thread_join_handle = thread::spawn(move || {
let result = machine.run();
Expand Down
4 changes: 2 additions & 2 deletions examples/ckb_vm_runner.rs
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ fn main_asm(code: Bytes, args: Vec<Bytes>) -> Result<(), Box<dyn std::error::Err
.syscall(Box::new(DebugSyscall {}))
.build();
let mut machine = ckb_vm::machine::asm::AsmMachine::new(core);
machine.load_program(&code, &args)?;
machine.load_program(&code, args.into_iter().map(Ok))?;
let exit = machine.run();
let cycles = machine.machine.cycles();
println!(
Expand All @@ -71,7 +71,7 @@ fn main_int(code: Bytes, args: Vec<Bytes>) -> Result<(), Box<dyn std::error::Err
let machine_builder = ckb_vm::DefaultMachineBuilder::new(core_machine)
.instruction_cycle_func(Box::new(estimate_cycles));
let mut machine = machine_builder.syscall(Box::new(DebugSyscall {})).build();
machine.load_program(&code, &args)?;
machine.load_program(&code, args.into_iter().map(Ok))?;
let exit = machine.run();
let cycles = machine.cycles();
println!(
Expand Down
6 changes: 3 additions & 3 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -22,7 +22,7 @@ pub use crate::{
instructions::{Instruction, Register},
machine::{
trace::TraceMachine, CoreMachine, DefaultCoreMachine, DefaultMachine,
DefaultMachineBuilder, InstructionCycleFunc, Machine, SupportMachine,
DefaultMachineBuilder, FlattenedArgsReader, InstructionCycleFunc, Machine, SupportMachine,
},
memory::{flat::FlatMemory, sparse::SparseMemory, wxorx::WXorXMemory, Memory},
syscalls::Syscalls,
Expand All @@ -47,7 +47,7 @@ pub fn run<R: Register, M: Memory<REG = R> + Default>(
WXorXMemory::new(M::default()),
);
let mut machine = TraceMachine::new(DefaultMachineBuilder::new(core_machine).build());
machine.load_program(program, args)?;
machine.load_program(program, args.into_iter().map(|e| Ok(e.clone())))?;
machine.run()
}

Expand All @@ -63,7 +63,7 @@ pub fn run_with_memory<R: Register, M: Memory<REG = R>>(
WXorXMemory::new(memory),
);
let mut machine = TraceMachine::new(DefaultMachineBuilder::new(core_machine).build());
machine.load_program(program, args)?;
machine.load_program(program, args.into_iter().map(|e| Ok(e.clone())))?;
machine.run()
}

Expand Down
8 changes: 6 additions & 2 deletions src/machine/asm/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -666,15 +666,19 @@ impl AsmMachine {
self.machine.inner.max_cycles = cycles;
}

pub fn load_program(&mut self, program: &Bytes, args: &[Bytes]) -> Result<u64, Error> {
pub fn load_program(
&mut self,
program: &Bytes,
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
self.machine.load_program(program, args)
}

pub fn load_program_with_metadata(
&mut self,
program: &Bytes,
metadata: &ProgramMetadata,
args: &[Bytes],
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
self.machine
.load_program_with_metadata(program, metadata, args)
Expand Down
84 changes: 75 additions & 9 deletions src/machine/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ use super::debugger::Debugger;
use super::decoder::{build_decoder, InstDecoder};
use super::elf::{parse_elf, LoadingAction, ProgramMetadata};
use super::instructions::{execute, Instruction, Register};
use super::memory::Memory;
use super::memory::{load_c_string, Memory};
use super::syscalls::Syscalls;
use super::{
registers::{A0, A7, REGISTER_ABI_NAMES, SP},
Expand Down Expand Up @@ -171,7 +171,7 @@ pub trait SupportMachine: CoreMachine {

fn initialize_stack(
&mut self,
args: &[Bytes],
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
stack_start: u64,
stack_size: u64,
) -> Result<u64, Error> {
Expand All @@ -183,7 +183,7 @@ pub trait SupportMachine: CoreMachine {
// reading "argc" will return an unexpected data. This situation is not very common.
//
// See https://github.com/nervosnetwork/ckb-vm/issues/106 for more details.
if self.version() >= VERSION1 && args.is_empty() {
if self.version() >= VERSION1 && args.len() == 0 {
let argc_size = u64::from(Self::REG::BITS / 8);
let origin_sp = stack_start + stack_size;
let unaligned_sp_address = origin_sp - argc_size;
Expand All @@ -200,15 +200,21 @@ pub trait SupportMachine: CoreMachine {
// of each argv object.
let mut values = vec![Self::REG::from_u64(args.len() as u64)];
for arg in args {
let arg = arg?;
let len = Self::REG::from_u64(arg.len() as u64 + 1);
let address = self.registers()[SP].overflowing_sub(&len);

self.memory_mut().store_bytes(address.to_u64(), arg)?;
self.memory_mut().store_bytes(address.to_u64(), &arg)?;
self.memory_mut()
.store_byte(address.to_u64() + arg.len() as u64, 1, 0)?;

values.push(address.clone());
self.set_register(SP, address);
self.set_register(SP, address.clone());

if self.version() >= VERSION2 && address.to_u64() < stack_start {
// Provides an early exit to large argv array.
return Err(Error::MemOutOfStack);
}
}
if self.version() >= VERSION1 {
// There are 2 standard requirements of the initialized stack:
Expand Down Expand Up @@ -246,7 +252,7 @@ pub trait SupportMachine: CoreMachine {
self.set_register(SP, address);
}
if self.registers()[SP].to_u64() < stack_start {
// args exceed stack size
// Args exceed stack size.
return Err(Error::MemOutOfStack);
}
Ok(stack_start + stack_size - self.registers()[SP].to_u64())
Expand Down Expand Up @@ -575,7 +581,11 @@ impl<Inner: CoreMachine> Display for DefaultMachine<Inner> {
}

impl<Inner: SupportMachine> DefaultMachine<Inner> {
pub fn load_program(&mut self, program: &Bytes, args: &[Bytes]) -> Result<u64, Error> {
pub fn load_program(
&mut self,
program: &Bytes,
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
let elf_bytes = self.load_elf(program, true)?;
let stack_bytes = self.initialize(args)?;
let bytes = elf_bytes.checked_add(stack_bytes).ok_or_else(|| {
Expand All @@ -590,7 +600,7 @@ impl<Inner: SupportMachine> DefaultMachine<Inner> {
&mut self,
program: &Bytes,
metadata: &ProgramMetadata,
args: &[Bytes],
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
let elf_bytes = self.load_binary(program, metadata, true)?;
let stack_bytes = self.initialize(args)?;
Expand All @@ -602,7 +612,10 @@ impl<Inner: SupportMachine> DefaultMachine<Inner> {
Ok(bytes)
}

fn initialize(&mut self, args: &[Bytes]) -> Result<u64, Error> {
fn initialize(
&mut self,
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
for syscall in &mut self.syscalls {
syscall.initialize(&mut self.inner)?;
}
Expand Down Expand Up @@ -766,6 +779,59 @@ impl Pause {
}
}

pub struct FlattenedArgsReader<'a, M: Memory> {
memory: &'a mut M,
argc: M::REG,
argv: M::REG,
cidx: M::REG,
}

impl<'a, M: Memory> FlattenedArgsReader<'a, M> {
pub fn new(memory: &'a mut M, argc: M::REG, argv: M::REG) -> Self {
Self {
memory,
argc,
argv,
cidx: M::REG::zero(),
}
}
}

impl<'a, M: Memory> Iterator for FlattenedArgsReader<'a, M> {
type Item = Result<Bytes, Error>;

fn next(&mut self) -> Option<Self::Item> {
if self.cidx.ge(&self.argc).to_u8() == 1 {
return None;
}
let addr = match M::REG::BITS {
32 => self.memory.load32(&self.argv),
64 => self.memory.load64(&self.argv),
_ => unreachable!(),
};
if let Err(err) = addr {
return Some(Err(err));
};
let addr = addr.unwrap();
let cstr = load_c_string(self.memory, &addr);
if let Err(err) = cstr {
return Some(Err(err));
};
let cstr = cstr.unwrap();
self.cidx = self.cidx.overflowing_add(&M::REG::from_u8(1));
self.argv = self
.argv
.overflowing_add(&M::REG::from_u8(M::REG::BITS / 8));
Some(Ok(cstr))
}
}

impl<'a, M: Memory> ExactSizeIterator for FlattenedArgsReader<'a, M> {
fn len(&self) -> usize {
self.argc.to_u64() as usize
}
}

#[cfg(test)]
mod tests {
use std::sync::atomic::AtomicU8;
Expand Down
8 changes: 6 additions & 2 deletions src/machine/trace.rs
Original file line number Diff line number Diff line change
Expand Up @@ -113,15 +113,19 @@ impl<Inner: SupportMachine> TraceMachine<Inner> {
}
}

pub fn load_program(&mut self, program: &Bytes, args: &[Bytes]) -> Result<u64, Error> {
pub fn load_program(
&mut self,
program: &Bytes,
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
self.machine.load_program(program, args)
}

pub fn load_program_with_metadata(
&mut self,
program: &Bytes,
metadata: &ProgramMetadata,
args: &[Bytes],
args: impl ExactSizeIterator<Item = Result<Bytes, Error>>,
) -> Result<u64, Error> {
self.machine
.load_program_with_metadata(program, metadata, args)
Expand Down
14 changes: 14 additions & 0 deletions src/memory/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -151,3 +151,17 @@ pub(crate) fn memset(slice: &mut [u8], value: u8) {
ptr::write_bytes(p, value, slice.len());
}
}

pub fn load_c_string<M: Memory>(memory: &mut M, addr: &M::REG) -> Result<Bytes, Error> {
let mut buffer = Vec::new();
let mut addr = addr.clone();
loop {
let byte = memory.load8(&addr)?.to_u8();
if byte == 0 {
break;
}
buffer.push(byte);
addr = addr.overflowing_add(&M::REG::from_u8(1));
}
Ok(Bytes::from(buffer))
}
12 changes: 6 additions & 6 deletions tests/machine_build.rs
Original file line number Diff line number Diff line change
Expand Up @@ -37,9 +37,9 @@ pub fn asm(path: &str, args: Vec<Bytes>, version: u32, isa: u8) -> AsmMachine {
.syscall(Box::new(SleepSyscall {}))
.build();
let mut machine = AsmMachine::new(core);
let mut argv = vec![Bytes::from("main")];
argv.extend_from_slice(&args);
machine.load_program(&buffer, &argv).unwrap();
let mut argv = vec![Ok(Bytes::from("main"))];
argv.extend(args.into_iter().map(Ok));
machine.load_program(&buffer, argv.into_iter()).unwrap();
machine
}

Expand All @@ -58,8 +58,8 @@ pub fn int(
.syscall(Box::new(SleepSyscall {}))
.build(),
);
let mut argv = vec![Bytes::from("main")];
argv.extend_from_slice(&args);
machine.load_program(&buffer, &argv).unwrap();
let mut argv = vec![Ok(Bytes::from("main"))];
argv.extend(args.into_iter().map(Ok));
machine.load_program(&buffer, argv.into_iter()).unwrap();
machine
}
Loading

0 comments on commit 10ec946

Please sign in to comment.