Explaining 200 Line Lightweight Streams in Rust
Lightweight threads (coroutines, coroutines, green threads) are a very powerful mechanism in modern programming languages. In this article, Carl Fredrik Samson tried to implement a runtime for lightweight streams on Rast, along the way explaining how they work under the hood.
It should also be noted that the article is not super fresh, so in order for the examples to work in the modern nightly version of the Rust compiler, you will most likely need changes that can be found in the code repository for this article.
He translated for himself for the most part. Write about all the comments - I will correct it promptly. I tried to translate the text closely, but in some places I reformulated it to make it easier to read and understand.
Green Threads
Green threads solve a common problem in programming - you don't want your code to block the processor, wasting resources. This is solved by using multitasking, which allows you to pause the execution of one piece of code, launching another for execution, switching between "contexts".
, — . — . , .
:
- ()
, . — "-" ( - ). , , UI (User Interface — ) , . , , , .
. , - , , - . (yielding
control) . - , - . , /. , , - , .
, , . , . .
-, . , .. . , .
— x86-64. 16 :
, "callee saved". , — , , .. .
, . , . :
mov %rsp, %rax
. . , , ( )
: AT&T .
AT&T Rust. , . LLVM. LLVM , .
AT&T.
. , . %rax
, :
%rax # 64 (8 ) %eax # 32 "rax" %ax # 16 "rax" %ah # 8 "ax" "rax" %al # 8 "rax"
+-----------------------------------------------------------------------+ |76543210 76543210 76543210 76543210 76543210 76543210 76543210 76543210| +--------+--------+--------+--------+--------+--------+--------+--------+ | | | | | | | %ah | %al | +--------+--------+--------+--------+--------+--------+--------+--------+ | | | | | | | %ax | +--------+--------+--------+--------+--------+--------+-----------------+ | | | | | %eax | +--------+--------+--------+--------+-----------------------------------+ | %rax | +-----------------------------------------------------------------------+
, . 64, 64 .
"" . , 16 , 16 . , .. AT&T q
(quad-word — ) l
(long-word — ). movq
4 * 16 = 64 .
mov
, . AT&T.
16 x86-64. .
,
, .
"green_threads".
cargo init
- , , :
rustup override set nightly
main.rs
, llvm_asm!
:
#![feature(llvm_asm)]
, 48 , .
const SSIZE: isize = 48;
, . , , , , .
#[derive(Debug, Default)]
#[repr(C)]
struct ThreadContext {
rsp: u64,
}
, "callee saved" , . ABI x86-64. , .
, - , #[repr(C)]
. ABI, , rsp
8 . ABI, .
fn hello() -> ! {
println!("I LOVE WAKING UP ON A NEW STACK!");
loop {}
}
, , .
, :
unsafe fn gt_switch(new: *const ThreadContext) {
llvm_asm!("
mov 0x00($0), %rsp
ret
"
:
: "r"(new)
:
: "alignstack" // ,
);
}
. , . , rsp
( new.rsp
, , ). ?
ret
, . %rsp
, , , . ret
, .
, , .
, . . , :
unsafe
— , , . , .
gt_switch(new: *const ThreadContext)
— ThreadContext
, .
llvm_asm!("
— . , - AT&T (-).
, — — mov 0x00($0), %rsp
. , , 0x00 ( ; ) $0 , rsp
. rsp
. , , .
$0
. . , 0, 1, 2 .., output
input
. , $0
.
$
, , , ( ), (, , x86 x86-64).
ret
— , , , . , .
output :
. , . output
, , .
input : "r"(new)
— input
. "r"
— , (constraint
). , (, - ). "r"
, . — , , , .
clobber list :
— clobber list
— , , , , . , , , , . .. , .
options : "alignstack"
— . : alignstack
, volatile
intel
. , . Windows alignstack
.
fn main() {
let mut ctx = ThreadContext::default();
let mut stack = vec![0_u8; SSIZE as usize];
unsafe {
let stack_bottom = stack.as_mut_ptr().offset(SSIZE);
let sb_aligned = (stack_bottom as usize & !15) as *mut u8;
std::ptr::write(sb_aligned.offset(-16) as *mut u64, hello as u64);
ctx.rsp = sb_aligned.offset(-16) as u64;
gt_switch(&mut ctx);
}
}
. hello
( ), u64
, 64 , .
, — ( ). 48 0 47, 32 16 / .
|0 1 2 3 4 |4 5 |0123456789 012345|6789 0123456789 01|23456789 01234567|89 0123456789 | | |XXXXXXXX | | | | stack bottom |0th byte |16th byte |32nd byte
, 16 (, 16 ?)
let sb_aligned = (stack_bottom as usize & !15) as *mut u8;
?Vec<u8>
, , 16 . , 16 . , .
, u64
u8
. u64
32-39, 8 . u64
- 32, , .
rsp
(Stack Pointer — ) 32 . u64
-, , .
cargo run
, :
dau@dau-work-pc:~/Projects/rust-programming-book/green_threads/green_threads$ cargo run Compiling green_threads v0.1.0 (/home/dau/Projects/rust-programming-book/green_threads/green_threads) Finished dev [unoptimized + debuginfo] target(s) in 0.44s Running `target/debug/green_threads` I LOVE WAKING UP ON A NEW STACK!
? hello
, . : . .
. . "" " " — .
, . (push/pop) , . .
— , , Rust Programming Language.
. 64 8 . , u8
, , , 000
, 0008
0016
.
, .
stack pointer
, 16 , , , , 16 ( — ). , , , 0008
(, ).
( gt_switch
), .
: — hello
, , .
print!(
"hello func address: 0x{addr:016X} ({addr})\n\n",
addr = hello as usize
);
for i in (0..SSIZE).rev() {
print!(
"mem: {}, value: 0x{:02X}\n{}",
stack.as_ptr().offset(i as isize) as usize,
*stack.as_ptr().offset(i as isize),
if i % 8 == 0 { "\n" } else { "" }
);
}
:
hello func address: 0x0000560CD80B50B0 (94613164216496) mem: 94613168839439, value: 0x00 mem: 94613168839438, value: 0x00 mem: 94613168839437, value: 0x00 mem: 94613168839436, value: 0x00 mem: 94613168839435, value: 0x00 mem: 94613168839434, value: 0x00 mem: 94613168839433, value: 0x00 mem: 94613168839432, value: 0x00 mem: 94613168839431, value: 0x00 mem: 94613168839430, value: 0x00 mem: 94613168839429, value: 0x56 mem: 94613168839428, value: 0x0C mem: 94613168839427, value: 0xD8 mem: 94613168839426, value: 0x0B mem: 94613168839425, value: 0x50 mem: 94613168839424, value: 0xB0 mem: 94613168839423, value: 0x00 mem: 94613168839422, value: 0x00 mem: 94613168839421, value: 0x00 mem: 94613168839420, value: 0x00 mem: 94613168839419, value: 0x00 mem: 94613168839418, value: 0x00 mem: 94613168839417, value: 0x00 mem: 94613168839416, value: 0x00 mem: 94613168839415, value: 0x00 mem: 94613168839414, value: 0x00 mem: 94613168839413, value: 0x00 mem: 94613168839412, value: 0x00 mem: 94613168839411, value: 0x00 mem: 94613168839410, value: 0x00 mem: 94613168839409, value: 0x00 mem: 94613168839408, value: 0x00 mem: 94613168839407, value: 0x00 mem: 94613168839406, value: 0x00 mem: 94613168839405, value: 0x00 mem: 94613168839404, value: 0x00 mem: 94613168839403, value: 0x00 mem: 94613168839402, value: 0x00 mem: 94613168839401, value: 0x00 mem: 94613168839400, value: 0x00 mem: 94613168839399, value: 0x00 mem: 94613168839398, value: 0x00 mem: 94613168839397, value: 0x00 mem: 94613168839396, value: 0x00 mem: 94613168839395, value: 0x00 mem: 94613168839394, value: 0x00 mem: 94613168839393, value: 0x00 mem: 94613168839392, value: 0x00 I LOVE WAKING UP ON A NEW STACK!
u64
, , ( — .).
, , , , 94613168839392
94613168839439
.
94613168839424
94613168839431
. — stack pointer
, , %rsp%
. , . ( — !!!)
0xB0, 0x50, 0x0B, 0xD8, 0x0C, 0x56, 0x00, 0x00
— ( ) hello()
, u8
.
, , 48 , , , .
, 8 , . , , , . " " (stack overflow), .
, , . 8 , , , -. , , , , , .
(growable — ) . , . , , , , .
Go. 8 , , . , , , . , GO ( ), .
, : (Vec<u8>
) . , . , , .
, , - , . - ,push()
( — .) . , , .
, , . , .
Windows x86-64 , x86-64 psABI. Windows , , , , , .
psABI :
, %rsp
— . , , base pointer, 16. 8 , , , . , - .
, stack_ptr + SSIZE - 16
, . - SSIZE
— .
. , ( — ) 8 . , rsp
16 , ABI.
- , stack_ptr + SSIZE - 16
. :
- ,
stack_ptr + SSIZE
( 16 ), .. , . - ,
stack_ptr + SSIZE - 8
, , 16 .
stack_ptr + SSIZE - 16
. 8 -16, -15, -14, ..., -9
(, , bottom of stack, .. ( — , , — , )).
, , , .
, , , .
, , 1024 , , . .
, , . : BEFORE.txt
( ) AFTER.txt
( ). , .
- , — .
#![feature(llvm_asm)]
#![feature(naked_functions)]
use std::io::Write;
const SSIZE: isize = 1024;
static mut S_PTR: *const u8 = 0 as *const u8;
#[derive(Debug, Default)]
#[repr(C)]
struct ThreadContext {
rsp: u64,
r15: u64,
r14: u64,
r13: u64,
r12: u64,
rbx: u64,
rbp: u64,
}
fn print_stack(filename: &str) {
let mut f = std::fs::File::create(filename).unwrap();
unsafe {
for i in (0..SSIZE).rev() {
writeln!(
f,
"mem: {}, val: {}",
S_PTR.offset(i as isize) as usize,
*S_PTR.offset( i as isize)
)
.expect("Error writing to file.");
}
}
}
fn hello() {
println!("I LOVE WAKING UP ON A NEW STACK!");
print_stack("AFTER.txt");
loop {}
}
unsafe fn gt_switch(new: *const ThreadContext) {
llvm_asm!("
mov 0x00($0), %rsp
ret
"
:
: "r"(new)
:
: "alignstack"
);
}
fn main() {
let mut ctx = ThreadContext::default();
let mut stack = vec![0_u8; SSIZE as usize];
let stack_ptr = stack.as_mut_ptr();
unsafe {
S_PTR = stack_ptr;
std::ptr::write(stack_ptr.offset(SSIZE - 16) as *mut u64, hello as u64);
print_stack("BEFORE.txt");
ctx.rsp = stack_ptr.offset(SSIZE - 16) as u64;
gt_switch(&mut ctx);
}
}
, , , , , , " " (best practicies) . , , , - , , , PR .
, — main.rs
, , :
#![feature(llvm_asm)]
#![feature(naked_functions)]
use std::ptr;
const DEFAULT_STACK_SIZE: usize = 1024 * 1024 * 2;
const MAX_THREADS: usize = 4;
static mut RUNTIME: usize = 0;
: asm
naked_functions
, .
naked_functions
, "" "", - , . , , . #[naked]
. .
,naked_functions
RFC #1201.
Naked- . , , , .. naked- .ret
naked- ( , ABI), . .
DEFAULT_STACK_SIZE
2 , , . (MAX_THREADS
) 4, .. .
— RUNTIME
— , (, , , , ).
- :
pub struct Runtime {
threads: Vec<Thread>,
current: usize,
}
#[derive(Debug, Eq, PartialEq)]
enum State {
Available,
Running,
Ready,
}
struct Thread {
id: usize,
stack: Vec<u8>,
ctx: ThreadContext,
state: State,
}
#[derive(Debug, Default)]
#[repr(C)]
struct ThreadContext {
rps: u64,
r15: u64,
r14, u64,
r13: u64,
r12: u64,
rbx: u64,
rbp: u64,
}
Runtime
. , . Thread
current
, , .
Thread
. , , id
. stack
, . ctx
, , . state
— .
State
— , :
Available
— , .Running
—Ready
— .
ThreadContext
, .
, " " , . x86-64 "callee saved".
:
impl Thread {
fn new(id: usize) -> Self {
Thread {
id,
stack: vec![0_u8; DEFAULT_STACK_SIZE],
ctx: ThreadContext::default(),
state: State::Available,
}
}
}
. Available
, , .
, . , .. . , , .
, , , .push()
, . , .
,Vec<T>
into_boxed_slice()
,Box<[T]>
— , . , .
impl Runtime
, .
impl Runtime {
pub fn new() -> Self {
let base_thread = Thread {
id: 0,
stack: vec![0_u8; DEFAULT_STACK_SIZE],
ctx: ThreadContext::default(),
state: State::Running,
};
let mut threads = vec![base_thread];
let mut available_threads: Vec<Thread> = (1..MAX_THREADS).map(|i| Thread::new(i)).collect();
threads.append(&mut available_threads);
Runtime {
threads,
current: 0,
}
}
// code of other methods is here
// ...
}
Runtime
Running
. . , 0
, .
// , Runtime
// , yield
// .
//
pub fn init(&self) {
unsafe {
let r_ptr: *const Runtime = self;
RUNTIME = r_ptr as usize;
}
}
. , , , yield
. , , , .
pub fn run(&mut self) -> ! {
while self.t_yield() {};
std::process::exit(0);
}
, . t_yield()
, false
, , , .
fn t_return(&mut self) {
if self.current != 0 {
std.threads[self.current].state = State::Available;
self.t_yield();
}
}
, . t_return
, .. return
. , — , , .
, . yield
. (spawned) , , , .. guard
( ). , t_return
— guard
.
Available
, , (task), t_yield
, .
yield
:
fn t_yield(&mut self) -> bool {
let mut post = self.current;
while self.threads[pos].state != State::Ready {
pos += 1;
if pos == self.threads.len() {
pos = 0;
}
if pos == self.current {
return false;
}
}
if self.threads[self.current].state != State::Available {
self.threads[self.current].state = State::Ready;
}
self.threads[pos].state = State::Running;
let old_pos = self.current;
self.current = pos;
unsafe {
let old: *mut ThreadContext = &mut self.threads[old_pos].ctx;
let new: *const ThreadContext = &self.threads[pos].ctx;
llvm_asm!(
"
mov $0, %rdi
mov $1, %rsi
"
:
: "r"(old), "r"(new)
:
:
);
switch();
}
self.threads.len() > 0
}
. t_yield
, .. yield
(. — , ).
, - Ready
, , , . , .
Ready
, . , (round-robin). , .
. , (Ready
) -, , ?
. , , (poll) . ,IsReady
, ,Pending
, - .Ready
, . ? , , , .
, , Running
Ready
.
switch
, . , , .
naked
naked . , . , , , . ,#[naked]
, . "" ""ThreadContext
, . Linux%rdi
, —%rsi
.
self.threads.len() > 0
— , . Windows, Linux, , . std::hint::black_box
, , , , . , , . , .
spawn()
:
pub fn spawn(&mut self, f: fn()) {
let available = self
.threads
.iter_mut()
.find(|t| t.state == State::Available)
.expect("no available thread.");
let size == available.stack.len();
unsafe {
let s_ptr = available.stack.as_mut_ptr().offset(size as isize);
let s_ptr = (s_ptr as usize & !15) as *mut u8;
std::ptr::write(s_ptr.offset(-16) as *mut u64, guard as u64);
std::ptr::write(s_ptr.offset(-24) as *mut u64, skip as u64);
std::ptr::write(s_ptr.offset(-32) as *mut u64, f as u64);
available.ctx.rsp = s_ptr.offset(-32) as u64;
}
available.state = State::Ready;
}
// `impl Runtime`
, t_yield
, spawn
.
, , , , , psABI.
, , (.. Available
). , , , , . .
, ( u8
) .
unsafe-. , 16 . guard
, , . skip
, , f
, guard
16 . , , f
.
, . ,f
, . base pointer .skip
guard
.guard
16 , ABI.
, , rsp
( ) . .
, Ready
, , , . , "" .
. , , . , , .
guard
, skip
switch
fn guard() {
unsafe {
let rt_ptr = RUNTIME as *mut Runtime;
(*rt_ptr).t_return();
};
}
, , , , , , t_return()
. , , , , t_return
, . Available
( ), t_yield
, .
#[naked]
fn skip() { }
skip
. #[naked]
, ret
, , . , guard
.
pub fn yield_thread() {
unsafe {
let rt_ptr = RUNTIME as *mut Runtime;
(*rt_ptr).t_yield();
};
}
, t_yield
. , , (), . , , .
, . , .
#[naked]
#[inline(never)]
unsafe fn switch() {
llvm_asm!("
mov %rsp, 0x00(%rdi)
mov %r15, 0x08(%rdi)
mov %r14, 0x10(%rdi)
mov %r13, 0x18(%rdi)
mov %r12, 0x20(%rdi)
mov %rbx, 0x28(%rdi)
mov %rbp, 0x30(%rdi)
mov 0x00(%rsi), %rsp
mov 0x08(%rsi), %r15
mov 0x10(%rsi), %r14
mov 0x18(%rsi), %r13
mov 0x20(%rsi), %r12
mov 0x28(%rsi), %rbx
mov 0x30(%rsi), %rbp
"
);
}
. , , , , , "" .
, , .
#[naked]
. , , , . , .
. #[inline(never)]
, . , , --release
.
main
fn main() {
let mut runtime = Runtime::new();
runtime.init();
runtime.spawn(|| {
println!("THREAD 1 STARTING");
let id = 1;
for i in 1..=10 {
println!("thread: {} counter: {}", id, i);
yield_thread();
}
println!("THREAD 1 FINISHED");
});
runtime.spawn(|| {
println!("THREAD 2 STARTING");
let id = 2;
for i in 1..=15 {
println!("thread: {} counter: {}", id i);
yield_thread();
}
println!("THREAD 2 FINISHED");
});
runtime.run();
}
, , 0 9 15, . cargo run
, :
THREAD 1 STARTING thread: 1 counter: 1 THREAD 2 STARTING thread: 2 counter: 1 thread: 1 counter: 2 thread: 2 counter: 2 thread: 1 counter: 3 thread: 2 counter: 3 thread: 1 counter: 4 thread: 2 counter: 4 thread: 1 counter: 5 thread: 2 counter: 5 thread: 1 counter: 6 thread: 2 counter: 6 thread: 1 counter: 7 thread: 2 counter: 7 thread: 1 counter: 8 thread: 2 counter: 8 thread: 1 counter: 9 thread: 2 counter: 9 thread: 1 counter: 10 thread: 2 counter: 10 THREAD 1 FINISHED thread: 2 counter: 11 thread: 2 counter: 12 thread: 2 counter: 13 thread: 2 counter: 14 thread: 2 counter: 15 THREAD 2 FINISHED
. , . 1 , 2 .
, . , , . !