mirror of
https://github.com/NotAShelf/microfetch.git
synced 2026-04-27 10:55:20 +00:00
418 lines
11 KiB
Rust
418 lines
11 KiB
Rust
//! Incredibly fast syscall wrappers for using inline assembly. Serves the
|
|
//! purposes of completely bypassing Rust's standard library in favor of
|
|
//! handwritten Assembly. Is this a good idea? No. Is it fast? Yeah, but only
|
|
//! marginally. Either way it serves a purpose and I will NOT accept criticism.
|
|
//! What do you mean I wasted two whole hours to make the program only 100µs
|
|
//! faster?
|
|
//!
|
|
//! Supports `x86_64`, `aarch64`, `riscv64`, and `loongarch64` architectures.
|
|
|
|
#![no_std]
|
|
|
|
// Ensure we're compiling for a supported architecture.
|
|
#[cfg(not(any(
|
|
target_arch = "x86_64",
|
|
target_arch = "aarch64",
|
|
target_arch = "riscv64",
|
|
target_arch = "loongarch64"
|
|
)))]
|
|
compile_error!(
|
|
"Unsupported architecture: only x86_64, aarch64, riscv64, and loongarch64 \
|
|
are supported"
|
|
);
|
|
|
|
// Per-arch syscall implementations live in their own module files.
|
|
#[cfg(target_arch = "x86_64")]
|
|
#[path = "x86_64.rs"]
|
|
mod arch;
|
|
#[cfg(target_arch = "aarch64")]
|
|
#[path = "aarch64.rs"]
|
|
mod arch;
|
|
#[cfg(target_arch = "riscv64")]
|
|
#[path = "riscv64.rs"]
|
|
mod arch;
|
|
#[cfg(target_arch = "loongarch64")]
|
|
#[path = "loongarch64.rs"]
|
|
mod arch;
|
|
|
|
/// Copies `n` bytes from `src` to `dest`.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// `dest` and `src` must be valid pointers to non-overlapping regions of
|
|
/// memory of at least `n` bytes.
|
|
#[unsafe(no_mangle)]
|
|
pub unsafe extern "C" fn memcpy(
|
|
dest: *mut u8,
|
|
src: *const u8,
|
|
n: usize,
|
|
) -> *mut u8 {
|
|
for i in 0..n {
|
|
unsafe {
|
|
*dest.add(i) = *src.add(i);
|
|
}
|
|
}
|
|
dest
|
|
}
|
|
|
|
/// Fills memory region with a byte value.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// `s` must be a valid pointer to memory of at least `n` bytes.
|
|
/// The value in `c` is treated as unsigned (lower 8 bits used).
|
|
#[unsafe(no_mangle)]
|
|
pub unsafe extern "C" fn memset(s: *mut u8, c: i32, n: usize) -> *mut u8 {
|
|
for i in 0..n {
|
|
unsafe {
|
|
*s.add(i) = u8::try_from(c).unwrap_or(0);
|
|
}
|
|
}
|
|
s
|
|
}
|
|
|
|
/// Compares two byte sequences.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// `s1` and `s2` must be valid pointers to memory of at least `n` bytes.
|
|
#[unsafe(no_mangle)]
|
|
pub unsafe extern "C" fn bcmp(s1: *const u8, s2: *const u8, n: usize) -> i32 {
|
|
for i in 0..n {
|
|
let a = unsafe { *s1.add(i) };
|
|
let b = unsafe { *s2.add(i) };
|
|
if a != b {
|
|
return i32::from(a) - i32::from(b);
|
|
}
|
|
}
|
|
0
|
|
}
|
|
|
|
/// Compares two byte sequences.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// `s1` and `s2` must be valid pointers to memory of at least `n` bytes.
|
|
#[unsafe(no_mangle)]
|
|
pub unsafe extern "C" fn memcmp(s1: *const u8, s2: *const u8, n: usize) -> i32 {
|
|
unsafe { bcmp(s1, s2, n) }
|
|
}
|
|
|
|
/// Calculates the length of a null-terminated string.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// `s` must be a valid pointer to a null-terminated string.
|
|
#[unsafe(no_mangle)]
|
|
pub const unsafe extern "C" fn strlen(s: *const u8) -> usize {
|
|
let mut len = 0;
|
|
while unsafe { *s.add(len) } != 0 {
|
|
len += 1;
|
|
}
|
|
len
|
|
}
|
|
|
|
/// Function pointer type for the main application entry point.
|
|
/// The function receives argc and argv and should return an exit code.
|
|
#[cfg(not(test))]
|
|
pub type MainFn = unsafe extern "C" fn(i32, *const *const u8) -> i32;
|
|
|
|
#[cfg(not(test))]
|
|
static mut MAIN_FN: Option<MainFn> = None;
|
|
|
|
/// Register the main function to be called from the entry point.
|
|
/// This must be called before the program starts (e.g., in a constructor).
|
|
#[cfg(not(test))]
|
|
pub fn register_main(main_fn: MainFn) {
|
|
unsafe {
|
|
MAIN_FN = Some(main_fn);
|
|
}
|
|
}
|
|
|
|
/// Rust entry point called from `_start` assembly.
|
|
///
|
|
/// The `stack` pointer points to:
|
|
/// `[rsp]` = argc
|
|
/// `[rsp+8]` = argv[0]
|
|
/// etc.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The `stack` pointer must point to valid stack memory set up by the kernel
|
|
/// AND the binary must define a `main` function with the following signature:
|
|
///
|
|
/// ```rust,ignore
|
|
/// unsafe extern "C" fn main(argc: i32, argv: *const *const u8) -> i32`
|
|
/// ```
|
|
#[cfg(not(test))]
|
|
#[unsafe(no_mangle)]
|
|
pub unsafe extern "C" fn entry_rust(stack: *const usize) -> i32 {
|
|
// Read argc and argv from stack
|
|
let argc = unsafe { *stack };
|
|
let argv = unsafe { stack.add(1).cast::<*const u8>() };
|
|
|
|
// SAFETY: argc is unlikely to exceed i32::MAX on real systems
|
|
let argc_i32 = i32::try_from(argc).unwrap_or(i32::MAX);
|
|
|
|
// Call the main function (defined by the binary crate)
|
|
unsafe { main(argc_i32, argv) }
|
|
}
|
|
|
|
// External main function that must be defined by the binary using this crate.
|
|
// Signature: `unsafe extern "C" fn main(argc: i32, argv: *const *const u8) ->
|
|
// i32`
|
|
#[cfg(not(test))]
|
|
unsafe extern "C" {
|
|
fn main(argc: i32, argv: *const *const u8) -> i32;
|
|
}
|
|
|
|
/// Direct syscall to open a file
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// File descriptor or -1 on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure:
|
|
///
|
|
/// - `path` points to a valid null-terminated C string
|
|
/// - The pointer remains valid for the duration of the syscall
|
|
#[inline]
|
|
#[must_use]
|
|
pub unsafe fn sys_open(path: *const u8, flags: i32) -> i32 {
|
|
unsafe { arch::sys_open(path, flags) }
|
|
}
|
|
|
|
/// Direct syscall to read from a file descriptor
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// Number of bytes read or -1 on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that:
|
|
///
|
|
/// - `buf` points to a valid writable buffer of at least `count` bytes
|
|
/// - `fd` is a valid open file descriptor
|
|
#[inline]
|
|
pub unsafe fn sys_read(fd: i32, buf: *mut u8, count: usize) -> isize {
|
|
unsafe { arch::sys_read(fd, buf, count) }
|
|
}
|
|
|
|
/// Direct syscall to write to a file descriptor
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// Number of bytes written or -1 on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that:
|
|
///
|
|
/// - `buf` points to a valid readable buffer of at least `count` bytes
|
|
/// - `fd` is a valid open file descriptor
|
|
#[inline]
|
|
#[must_use]
|
|
pub unsafe fn sys_write(fd: i32, buf: *const u8, count: usize) -> isize {
|
|
unsafe { arch::sys_write(fd, buf, count) }
|
|
}
|
|
|
|
/// Direct syscall to close a file descriptor
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that `fd` is a valid open file descriptor
|
|
#[inline]
|
|
#[must_use]
|
|
pub unsafe fn sys_close(fd: i32) -> i32 {
|
|
unsafe { arch::sys_close(fd) }
|
|
}
|
|
|
|
/// Raw buffer for the `uname(2)` syscall.
|
|
///
|
|
/// Linux ABI hasfive fields of `[i8; 65]`: sysname, nodename, release, version,
|
|
/// machine. The `domainname` field (GNU extension, `[i8; 65]`) follows but is
|
|
/// not used, nor any useful to us here.
|
|
#[repr(C)]
|
|
#[allow(dead_code)]
|
|
pub struct UtsNameBuf {
|
|
pub sysname: [i8; 65],
|
|
pub nodename: [i8; 65],
|
|
pub release: [i8; 65],
|
|
pub version: [i8; 65],
|
|
pub machine: [i8; 65],
|
|
pub domainname: [i8; 65], // GNU extension, included for correct struct size
|
|
}
|
|
|
|
/// Direct `uname(2)` syscall
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// 0 on success, negative on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that `buf` points to a valid `UtsNameBuf`.
|
|
#[inline]
|
|
#[allow(dead_code)]
|
|
pub unsafe fn sys_uname(buf: *mut UtsNameBuf) -> i32 {
|
|
unsafe { arch::sys_uname(buf) }
|
|
}
|
|
|
|
/// Raw buffer for the `statfs(2)` syscall.
|
|
///
|
|
/// Linux ABI (`x86_64` and `aarch64`): the fields we use are at the same
|
|
/// offsets on both architectures. Only the fields needed for disk usage are
|
|
/// declared; the remainder of the 120-byte struct is covered by `_pad`.
|
|
#[repr(C)]
|
|
pub struct StatfsBuf {
|
|
pub f_type: i64,
|
|
pub f_bsize: i64,
|
|
pub f_blocks: u64,
|
|
pub f_bfree: u64,
|
|
pub f_bavail: u64,
|
|
pub f_files: u64,
|
|
pub f_ffree: u64,
|
|
pub f_fsid: [i32; 2],
|
|
pub f_namelen: i64,
|
|
pub f_frsize: i64,
|
|
pub f_flags: i64,
|
|
|
|
#[allow(clippy::pub_underscore_fields, reason = "This is not a public API")]
|
|
pub _pad: [i64; 4],
|
|
}
|
|
|
|
/// Direct `statfs(2)` syscall
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// 0 on success, negative errno on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that:
|
|
///
|
|
/// - `path` points to a valid null-terminated string
|
|
/// - `buf` points to a valid `StatfsBuf`
|
|
#[inline]
|
|
pub unsafe fn sys_statfs(path: *const u8, buf: *mut StatfsBuf) -> i32 {
|
|
unsafe { arch::sys_statfs(path, buf) }
|
|
}
|
|
|
|
/// Read entire file using direct syscalls. This avoids libc overhead and can be
|
|
/// significantly faster for small files.
|
|
///
|
|
/// # Errors
|
|
///
|
|
/// Returns an error if the file cannot be opened or read. The error value is
|
|
/// the negated errno.
|
|
#[inline]
|
|
pub fn read_file_fast(path: &str, buffer: &mut [u8]) -> Result<usize, i32> {
|
|
const O_RDONLY: i32 = 0;
|
|
|
|
// We use stack-allocated buffer for null-terminated path. The maximum
|
|
// is 256 bytes.
|
|
let path_bytes = path.as_bytes();
|
|
if path_bytes.len() >= 256 {
|
|
return Err(-22); // EINVAL
|
|
}
|
|
|
|
let mut path_buf = [0u8; 256];
|
|
path_buf[..path_bytes.len()].copy_from_slice(path_bytes);
|
|
// XXX: Already zero-terminated since array is initialized to zeros
|
|
|
|
unsafe {
|
|
let fd = sys_open(path_buf.as_ptr(), O_RDONLY);
|
|
if fd < 0 {
|
|
return Err(fd);
|
|
}
|
|
|
|
let bytes_read = sys_read(fd, buffer.as_mut_ptr(), buffer.len());
|
|
let _ = sys_close(fd);
|
|
|
|
if bytes_read < 0 {
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
return Err(bytes_read as i32);
|
|
}
|
|
|
|
#[allow(clippy::cast_sign_loss)]
|
|
{
|
|
Ok(bytes_read as usize)
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Raw buffer for the `sysinfo(2)` syscall.
|
|
///
|
|
/// In the Linux ABI `uptime` is a `long` at offset 0. The remaining fields are
|
|
/// not needed, but are declared to give the struct its correct size (112 bytes
|
|
/// on 64-bit Linux).
|
|
///
|
|
/// The layout matches the kernel's `struct sysinfo` *exactly*:
|
|
/// `mem_unit` ends at offset 108, then 4 bytes of implicit padding to 112.
|
|
#[repr(C)]
|
|
pub struct SysInfo {
|
|
pub uptime: i64,
|
|
pub loads: [u64; 3],
|
|
pub totalram: u64,
|
|
pub freeram: u64,
|
|
pub sharedram: u64,
|
|
pub bufferram: u64,
|
|
pub totalswap: u64,
|
|
pub freeswap: u64,
|
|
pub procs: u16,
|
|
_pad: u16,
|
|
_pad2: u32, /* alignment padding to reach 8-byte boundary for
|
|
* totalhigh */
|
|
pub totalhigh: u64,
|
|
pub freehigh: u64,
|
|
pub mem_unit: u32,
|
|
// 4 bytes implicit trailing padding to reach 112 bytes total; no field
|
|
// needed
|
|
}
|
|
|
|
/// Direct `sysinfo(2)` syscall
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// 0 on success, negative errno on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that `info` points to a valid `SysInfo` buffer.
|
|
#[inline]
|
|
pub unsafe fn sys_sysinfo(info: *mut SysInfo) -> i64 {
|
|
unsafe { arch::sys_sysinfo(info) }
|
|
}
|
|
|
|
/// Direct `sched_getaffinity(2)` syscall
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// On success, the number of bytes written to the mask buffer (always a
|
|
/// multiple of `sizeof(long)`). On error, a negative errno.
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure that `mask` points to a buffer of at least
|
|
/// `mask_size` bytes.
|
|
#[inline]
|
|
pub unsafe fn sys_sched_getaffinity(
|
|
pid: i32,
|
|
mask_size: usize,
|
|
mask: *mut u8,
|
|
) -> i32 {
|
|
unsafe { arch::sys_sched_getaffinity(pid, mask_size, mask) }
|
|
}
|
|
|
|
/// Direct syscall to exit the process
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// This syscall never returns. The process will terminate immediately.
|
|
#[inline]
|
|
pub unsafe fn sys_exit(code: i32) -> ! {
|
|
unsafe { arch::sys_exit(code) }
|
|
}
|