Merge commit 'fba00e5d3404e1bcfe1007ee2e3bfc3b3bb888af' into update-subtrees

This commit is contained in:
Tim Allen 2021-08-01 09:46:29 +10:00
commit 139a44b142
10 changed files with 321 additions and 6 deletions

4
libco/doc/examples/.gitignore vendored Normal file
View file

@ -0,0 +1,4 @@
test_args
test_serialization
test_timing
*.o

8
libco/doc/examples/build.bat Executable file
View file

@ -0,0 +1,8 @@
cc -O3 -fomit-frame-pointer -I../.. -o libco.o -c ../../libco.c
c++ -O3 -fomit-frame-pointer -I../.. -c test_timing.cpp
c++ -O3 -fomit-frame-pointer -o test_timing libco.o test_timing.o
c++ -O3 -fomit-frame-pointer -I../.. -c test_args.cpp
c++ -O3 -fomit-frame-pointer -o test_args libco.o test_args.o
c++ -O3 -fomit-frame-pointer -I../.. -c test_serialization.cpp
c++ -O3 -fomit-frame-pointer -o test_serialization libco.o test_serialization.o
@del *.o

8
libco/doc/examples/build.sh Executable file
View file

@ -0,0 +1,8 @@
cc -O3 -fomit-frame-pointer -I../.. -o libco.o -c ../../libco.c
c++ -O3 -fomit-frame-pointer -I../.. -c test_timing.cpp
c++ -O3 -fomit-frame-pointer -o test_timing libco.o test_timing.o
c++ -O3 -fomit-frame-pointer -I../.. -c test_args.cpp
c++ -O3 -fomit-frame-pointer -o test_args libco.o test_args.o
c++ -O3 -fomit-frame-pointer -I../.. -c test_serialization.cpp
c++ -O3 -fomit-frame-pointer -o test_serialization libco.o test_serialization.o
rm -f *.o

View file

@ -0,0 +1,6 @@
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <libco.h>

View file

@ -0,0 +1,76 @@
/*****
* cothread parameterized function example
*****
* entry point to cothreads cannot take arguments.
* this is due to portability issues: each processor,
* operating system, programming language and compiler
* can use different parameter passing methods, so
* arguments to the cothread entry points were omitted.
*
* however, the behavior can easily be simulated by use
* of a specialized co_switch to set global parameters to
* be used as function arguments.
*
* in this way, with a bit of extra red tape, one gains
* even more flexibility than would be possible with a
* fixed argument list entry point, such as void (*)(void*),
* as any number of arguments can be used.
*
* this also eliminates race conditions where a pointer
* passed to co_create may have changed or become invalidated
* before call to co_switch, as said pointer would now be set
* when calling co_switch, instead.
*****/
#include "test.h"
cothread_t thread[3];
namespace co_arg {
int param_x;
int param_y;
};
//one could also call this co_init or somesuch if they preferred ...
void co_switch(cothread_t thread, int param_x, int param_y) {
co_arg::param_x = param_x;
co_arg::param_y = param_y;
co_switch(thread);
}
void co_entrypoint() {
int param_x = co_arg::param_x;
int param_y = co_arg::param_y;
printf("co_entrypoint(%d, %d)\n", param_x, param_y);
co_switch(thread[0]);
//co_arg::param_x will change here (due to co_switch(cothread_t, int, int) call changing values),
//however, param_x and param_y will persist as they are thread local
printf("co_entrypoint(%d, %d)\n", param_x, param_y);
co_switch(thread[0]);
throw;
}
int main() {
printf("cothread parameterized function example\n\n");
thread[0] = co_active();
thread[1] = co_create(65536, co_entrypoint);
thread[2] = co_create(65536, co_entrypoint);
//use specialized co_switch(cothread_t, int, int) for initial co_switch call
co_switch(thread[1], 1, 2);
co_switch(thread[2], 4, 8);
//after first call, entry point arguments have been initialized, standard
//co_switch(cothread_t) can be used from now on
co_switch(thread[2]);
co_switch(thread[1]);
printf("\ndone\n");
#if defined(_MSC_VER) || defined(__DJGPP__)
getch();
#endif
return 0;
}

View file

@ -0,0 +1,117 @@
#include "test.h"
#include <stdint.h>
#include <sys/mman.h>
namespace Thread {
cothread_t host;
cothread_t cpu;
cothread_t apu;
}
namespace Buffer {
uint8_t cpu[65536];
uint8_t apu[65536];
}
namespace Memory {
uint8_t* buffer;
}
struct CPU {
static auto Enter() -> void;
auto main() -> void;
auto sub() -> void;
auto leaf() -> void;
} cpu;
struct APU {
static auto Enter() -> void;
auto main() -> void;
auto sub() -> void;
auto leaf() -> void;
} apu;
auto CPU::Enter() -> void {
while(true) cpu.main();
}
auto CPU::main() -> void {
printf("2\n");
sub();
}
auto CPU::sub() -> void {
co_switch(Thread::apu);
printf("4\n");
leaf();
}
auto CPU::leaf() -> void {
int x = 42;
co_switch(Thread::host);
printf("6\n");
co_switch(Thread::apu);
printf("8 (%d)\n", x);
co_switch(Thread::host);
}
auto APU::Enter() -> void {
while(true) apu.main();
}
auto APU::main() -> void {
printf("3\n");
sub();
}
auto APU::sub() -> void {
co_switch(Thread::cpu);
printf("7\n");
leaf();
}
auto APU::leaf() -> void {
co_switch(Thread::cpu);
}
auto main() -> int {
if(!co_serializable()) {
printf("This implementation does not support serialization\n");
return 1;
}
Memory::buffer = (uint8_t*)mmap(
(void*)0x10'0000'0000, 2 * 65536,
PROT_READ | PROT_WRITE | PROT_EXEC,
MAP_FIXED | MAP_PRIVATE | MAP_ANONYMOUS, -1, 0
);
Memory::buffer[0] = 42;
printf("%p (%u)\n", Memory::buffer, Memory::buffer[0]);
Thread::host = co_active();
Thread::cpu = co_derive((void*)(Memory::buffer + 0 * 65536), 65536, CPU::Enter);
Thread::apu = co_derive((void*)(Memory::buffer + 1 * 65536), 65536, APU::Enter);
printf("1\n");
co_switch(Thread::cpu);
printf("5\n");
memcpy(Buffer::cpu, Thread::cpu, 65536);
memcpy(Buffer::apu, Thread::apu, 65536);
co_switch(Thread::cpu);
Thread::cpu = nullptr;
Thread::apu = nullptr;
Thread::cpu = co_derive((void*)(Memory::buffer + 0 * 65536), 65536, CPU::Enter);
Thread::apu = co_derive((void*)(Memory::buffer + 1 * 65536), 65536, APU::Enter);
printf("9\n");
memcpy(Thread::cpu, Buffer::cpu, 65536);
memcpy(Thread::apu, Buffer::apu, 65536);
co_switch(Thread::cpu);
Thread::cpu = nullptr;
Thread::apu = nullptr;
munmap((void*)0x900000000, 2 * 65536);
return 0;
}

View file

@ -0,0 +1,52 @@
#include "test.h"
enum { Iterations = 500000000 };
namespace thread {
cothread_t x;
cothread_t y;
volatile int counter;
}
void co_timingtest() {
for(;;) {
thread::counter++;
co_switch(thread::x);
}
}
void sub_timingtest() {
thread::counter++;
}
int main() {
printf("context-switching timing test\n\n");
time_t start, end;
int i, t1, t2;
start = clock();
for(thread::counter = 0, i = 0; i < Iterations; i++) {
sub_timingtest();
}
end = clock();
t1 = (int)difftime(end, start);
printf("%2.3f seconds per 50 million subroutine calls (%d iterations)\n", (float)t1 / CLOCKS_PER_SEC, thread::counter);
thread::x = co_active();
thread::y = co_create(65536, co_timingtest);
start = clock();
for(thread::counter = 0, i = 0; i < Iterations; i++) {
co_switch(thread::y);
}
end = clock();
co_delete(thread::y);
t2 = (int)difftime(end, start);
printf("%2.3f seconds per 100 million co_switch calls (%d iterations)\n", (float)t2 / CLOCKS_PER_SEC, thread::counter);
printf("co_switch skew = %fx\n\n", (double)t2 / (double)t1);
return 0;
}

View file

@ -9,7 +9,7 @@ C function call.
## libco.x86
* **Overhead:** ~5x
* **Supported processor(s):** 32-bit x86
*** Supported compiler(s**): any
* **Supported compiler(s):** any
* **Supported operating system(s):**
* Windows
* Mac OS X
@ -19,7 +19,7 @@ C function call.
## libco.amd64
* **Overhead:** ~10x (Windows), ~6x (all other platforms)
* **Supported processor(s):** 64-bit amd64
*** Supported compiler(s**): any
* **Supported compiler(s):** any
* **Supported operating system(s):**
* Windows
* Mac OS X

View file

@ -54,7 +54,9 @@ Handle to cothread.
Handle must be of type `void*`.
A value of `null` (0) indicates an uninitialized or invalid handle, whereas a non-zero value indicates a valid handle.
A value of null (0) indicates an uninitialized or invalid handle, whereas a
non-zero value indicates a valid handle. A valid handle is backed by execution
state to which the execution can be co_switch()ed to.
## co_active
```c
@ -62,7 +64,12 @@ cothread_t co_active();
```
Return handle to current cothread.
Always returns a valid handle, even when called from the main program thread.
Note that the handle is valid even if the function is called from a non-cothread
context. To achieve this, we save the execution state in an internal buffer,
instead of using the user-provided memory. Since this handle is valid, it can
be used to co_switch to this context from another cothread. In multi-threaded
applications, make sure to not switch non-cothread context across CPU cores,
to prevent any possible conflicts with the OS scheduler.
## co_derive
```c
@ -119,6 +126,19 @@ Passing handle of active cothread to this function is not allowed.
Passing handle of primary cothread is not allowed.
## co_serializable
```c
int co_serializable(void);
```
Returns non-zero if the implementation keeps the entire coroutine state in the
buffer passed to `co_derive()`. That is, if `co_serializable()` returns
non-zero, and if your cothread does not modify the heap or any process-wide
state, then you can "snapshot" the cothread's state by taking a copy of the
buffer originally passed to `co_derive()`, and "restore" a previous state
by copying the snapshot back into the buffer it came from.
## co_switch
```c
void co_switch(cothread_t cothread);

View file

@ -14,7 +14,7 @@
#if !defined(LIBCO_MP) /* Running in single-threaded environment */
#define thread_local
#else /* Running in multi-threaded environment */
#if defined(__STDC_VERSION__) /* Compiling as C Language */
#if defined(__STDC__) /* Compiling as C Language */
#if defined(_MSC_VER) /* Don't rely on MSVC's C11 support */
#define thread_local __declspec(thread)
#elif __STDC_VERSION__ < 201112L /* If we are on C90/99 */
@ -55,7 +55,7 @@
- alignas (TYPE) is equivalent to alignas (alignof (TYPE)).
*/
#if !defined(alignas)
#if defined(__STDC_VERSION__) /* C Language */
#if defined(__STDC__) /* C Language */
#if defined(_MSC_VER) /* Don't rely on MSVC's C11 support */
#define alignas(bytes) __declspec(align(bytes))
#elif __STDC_VERSION__ >= 201112L /* C11 and above */
@ -85,6 +85,30 @@
#define LIBCO_ASSERT assert
#endif
#if defined (__OpenBSD__)
#if !defined(LIBCO_MALLOC) || !defined(LIBCO_FREE)
#include <unistd.h>
#include <sys/mman.h>
static void* malloc_obsd(size_t size) {
long pagesize = sysconf(_SC_PAGESIZE);
char* memory = (char*)mmap(NULL, size + pagesize, PROT_READ|PROT_WRITE, MAP_STACK|MAP_PRIVATE|MAP_ANON, -1, 0);
if (memory == MAP_FAILED) return NULL;
*(size_t*)memory = size + pagesize;
memory += pagesize;
return (void*)memory;
}
static void free_obsd(void *ptr) {
char* memory = (char*)ptr - sysconf(_SC_PAGESIZE);
munmap(memory, *(size_t*)memory);
}
#define LIBCO_MALLOC malloc_obsd
#define LIBCO_FREE free_obsd
#endif
#endif
#if !defined(LIBCO_MALLOC) || !defined(LIBCO_FREE)
#include <stdlib.h>
#define LIBCO_MALLOC malloc