mirror of
https://github.com/NotAShelf/microfetch.git
synced 2025-12-08 05:53:51 +00:00
Signed-off-by: NotAShelf <raf@notashelf.dev> Change-Id: Ie1a13221aded56f903156fdb35abe2ac6a6a6964
210 lines
5 KiB
Rust
210 lines
5 KiB
Rust
//! Incredibly fast syscall wrappers for using inline assembly. Serves the
|
|
//! purposes of completely bypassing Rust's standard library in favor of
|
|
//! handwritten Assembly. Is this a good idea? No. Is it fast? Yeah, but only
|
|
//! marginally. Either way it serves a purpose and I will NOT accept criticism.
|
|
//! What do you mean I wasted two whole hours to make the program only 100µs
|
|
//! faster?
|
|
//!
|
|
//! Supports `x86_64` and `aarch64` architectures. Riscv support will be
|
|
//! implemented when and ONLY WHEN I can be bothered to work on it.
|
|
|
|
use std::io;
|
|
|
|
/// Direct syscall to open a file
|
|
///
|
|
/// # Returns
|
|
///
|
|
/// File descriptor or -1 on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure:
|
|
///
|
|
/// - `path` points to a valid null-terminated C string
|
|
/// - The pointer remains valid for the duration of the syscall
|
|
#[inline]
|
|
#[must_use]
|
|
pub unsafe fn sys_open(path: *const u8, flags: i32) -> i32 {
|
|
#[cfg(target_arch = "x86_64")]
|
|
unsafe {
|
|
let fd: i64;
|
|
std::arch::asm!(
|
|
"syscall",
|
|
in("rax") 2i64, // SYS_open
|
|
in("rdi") path,
|
|
in("rsi") flags,
|
|
in("rdx") 0i32, // mode (not used for reading)
|
|
lateout("rax") fd,
|
|
lateout("rcx") _,
|
|
lateout("r11") _,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
fd as i32
|
|
}
|
|
}
|
|
#[cfg(target_arch = "aarch64")]
|
|
unsafe {
|
|
let fd: i64;
|
|
std::arch::asm!(
|
|
"svc #0",
|
|
in("x8") 56i64, // SYS_openat
|
|
in("x0") -100i32, // AT_FDCWD
|
|
in("x1") path,
|
|
in("x2") flags,
|
|
in("x3") 0i32, // mode
|
|
lateout("x0") fd,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
fd as i32
|
|
}
|
|
}
|
|
#[cfg(not(any(target_arch = "x86_64", target_arch = "aarch64")))]
|
|
{
|
|
compile_error!("Unsupported architecture for inline assembly syscalls");
|
|
}
|
|
}
|
|
|
|
/// Direct syscall to read from a file descriptor
|
|
///
|
|
/// # Returns n
|
|
///
|
|
/// Number of bytes read or -1 on error
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure:
|
|
/// - `buf` points to a valid writable buffer of at least `count` bytes
|
|
/// - `fd` is a valid open file descriptor
|
|
#[inline]
|
|
pub unsafe fn sys_read(fd: i32, buf: *mut u8, count: usize) -> isize {
|
|
#[cfg(target_arch = "x86_64")]
|
|
unsafe {
|
|
let ret: i64;
|
|
std::arch::asm!(
|
|
"syscall",
|
|
in("rax") 0i64, // SYS_read
|
|
in("rdi") fd,
|
|
in("rsi") buf,
|
|
in("rdx") count,
|
|
lateout("rax") ret,
|
|
lateout("rcx") _,
|
|
lateout("r11") _,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
ret as isize
|
|
}
|
|
}
|
|
#[cfg(target_arch = "aarch64")]
|
|
unsafe {
|
|
let ret: i64;
|
|
std::arch::asm!(
|
|
"svc #0",
|
|
in("x8") 63i64, // SYS_read
|
|
in("x0") fd,
|
|
in("x1") buf,
|
|
in("x2") count,
|
|
lateout("x0") ret,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
ret as isize
|
|
}
|
|
}
|
|
#[cfg(not(any(target_arch = "x86_64", target_arch = "aarch64")))]
|
|
{
|
|
compile_error!("Unsupported architecture for inline assembly syscalls");
|
|
}
|
|
}
|
|
|
|
/// Direct syscall to close a file descriptor
|
|
///
|
|
/// # Safety
|
|
///
|
|
/// The caller must ensure `fd` is a valid open file descriptor
|
|
#[inline]
|
|
#[must_use]
|
|
pub unsafe fn sys_close(fd: i32) -> i32 {
|
|
#[cfg(target_arch = "x86_64")]
|
|
unsafe {
|
|
let ret: i64;
|
|
std::arch::asm!(
|
|
"syscall",
|
|
in("rax") 3i64, // SYS_close
|
|
in("rdi") fd,
|
|
lateout("rax") ret,
|
|
lateout("rcx") _,
|
|
lateout("r11") _,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
ret as i32
|
|
}
|
|
}
|
|
#[cfg(target_arch = "aarch64")]
|
|
unsafe {
|
|
let ret: i64;
|
|
std::arch::asm!(
|
|
"svc #0",
|
|
in("x8") 57i64, // SYS_close
|
|
in("x0") fd,
|
|
lateout("x0") ret,
|
|
options(nostack)
|
|
);
|
|
#[allow(clippy::cast_possible_truncation)]
|
|
{
|
|
ret as i32
|
|
}
|
|
}
|
|
#[cfg(not(any(target_arch = "x86_64", target_arch = "aarch64")))]
|
|
{
|
|
compile_error!("Unsupported architecture for inline assembly syscalls");
|
|
}
|
|
}
|
|
|
|
/// Read entire file using direct syscalls. This avoids libc overhead and can be
|
|
/// significantly faster for small files.
|
|
///
|
|
/// # Errors
|
|
///
|
|
/// Returns an error if the file cannot be opened or read
|
|
#[inline]
|
|
pub fn read_file_fast(path: &str, buffer: &mut [u8]) -> io::Result<usize> {
|
|
const O_RDONLY: i32 = 0;
|
|
|
|
// Use stack-allocated buffer for null-terminated path (max 256 bytes)
|
|
let path_bytes = path.as_bytes();
|
|
if path_bytes.len() >= 256 {
|
|
return Err(io::Error::new(io::ErrorKind::InvalidInput, "Path too long"));
|
|
}
|
|
|
|
let mut path_buf = [0u8; 256];
|
|
path_buf[..path_bytes.len()].copy_from_slice(path_bytes);
|
|
// XXX: Already zero-terminated since array is initialized to zeros
|
|
|
|
unsafe {
|
|
let fd = sys_open(path_buf.as_ptr(), O_RDONLY);
|
|
if fd < 0 {
|
|
return Err(io::Error::last_os_error());
|
|
}
|
|
|
|
let bytes_read = sys_read(fd, buffer.as_mut_ptr(), buffer.len());
|
|
let _ = sys_close(fd);
|
|
|
|
if bytes_read < 0 {
|
|
return Err(io::Error::last_os_error());
|
|
}
|
|
|
|
#[allow(clippy::cast_sign_loss)]
|
|
{
|
|
Ok(bytes_read as usize)
|
|
}
|
|
}
|
|
}
|