| 1 | /* |
| 2 | * Copyright (c) 2001-2012,2015 Marc Alexander Lehmann <schmorp@schmorp.de> |
| 3 | * |
| 4 | * Redistribution and use in source and binary forms, with or without modifica- |
| 5 | * tion, are permitted provided that the following conditions are met: |
| 6 | * |
| 7 | * 1. Redistributions of source code must retain the above copyright notice, |
| 8 | * this list of conditions and the following disclaimer. |
| 9 | * |
| 10 | * 2. Redistributions in binary form must reproduce the above copyright |
| 11 | * notice, this list of conditions and the following disclaimer in the |
| 12 | * documentation and/or other materials provided with the distribution. |
| 13 | * |
| 14 | * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED |
| 15 | * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MER- |
| 16 | * CHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO |
| 17 | * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPE- |
| 18 | * CIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| 19 | * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; |
| 20 | * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, |
| 21 | * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTH- |
| 22 | * ERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED |
| 23 | * OF THE POSSIBILITY OF SUCH DAMAGE. |
| 24 | * |
| 25 | * Alternatively, the contents of this file may be used under the terms of |
| 26 | * the GNU General Public License ("GPL") version 2 or any later version, |
| 27 | * in which case the provisions of the GPL are applicable instead of |
| 28 | * the above. If you wish to allow the use of your version of this file |
| 29 | * only under the terms of the GPL and not to allow others to use your |
| 30 | * version of this file under the BSD license, indicate your decision |
| 31 | * by deleting the provisions above and replace them with the notice |
| 32 | * and other provisions required by the GPL. If you do not delete the |
| 33 | * provisions above, a recipient may use your version of this file under |
| 34 | * either the BSD or the GPL. |
| 35 | * |
| 36 | * This library is modelled strictly after Ralf S. Engelschalls article at |
| 37 | * http://www.gnu.org/software/pth/rse-pmt.ps. So most of the credit must |
| 38 | * go to Ralf S. Engelschall <rse@engelschall.com>. |
| 39 | * |
| 40 | * This coroutine library is very much stripped down. You should either |
| 41 | * build your own process abstraction using it or - better - just use GNU |
| 42 | * Portable Threads, http://www.gnu.org/software/pth/. |
| 43 | * |
| 44 | */ |
| 45 | |
| 46 | /* |
| 47 | * 2006-10-26 Include stddef.h on OS X to work around one of its bugs. |
| 48 | * Reported by Michael_G_Schwern. |
| 49 | * 2006-11-26 Use _setjmp instead of setjmp on GNU/Linux. |
| 50 | * 2007-04-27 Set unwind frame info if gcc 3+ and ELF is detected. |
| 51 | * Use _setjmp instead of setjmp on _XOPEN_SOURCE >= 600. |
| 52 | * 2007-05-02 Add assembly versions for x86 and amd64 (to avoid reliance |
| 53 | * on SIGUSR2 and sigaltstack in Crossfire). |
| 54 | * 2008-01-21 Disable CFI usage on anything but GNU/Linux. |
| 55 | * 2008-03-02 Switched to 2-clause BSD license with GPL exception. |
| 56 | * 2008-04-04 New (but highly unrecommended) pthreads backend. |
| 57 | * 2008-04-24 Reinstate CORO_LOSER (had wrong stack adjustments). |
| 58 | * 2008-10-30 Support assembly method on x86 with and without frame pointer. |
| 59 | * 2008-11-03 Use a global asm statement for CORO_ASM, idea by pippijn. |
| 60 | * 2008-11-05 Hopefully fix misaligned stacks with CORO_ASM/SETJMP. |
| 61 | * 2008-11-07 rbp wasn't saved in CORO_ASM on x86_64. |
| 62 | * introduce coro_destroy, which is a nop except for pthreads. |
| 63 | * speed up CORO_PTHREAD. Do no longer leak threads either. |
| 64 | * coro_create now allows one to create source coro_contexts. |
| 65 | * do not rely on makecontext passing a void * correctly. |
| 66 | * try harder to get _setjmp/_longjmp. |
| 67 | * major code cleanup/restructuring. |
| 68 | * 2008-11-10 the .cfi hacks are no longer needed. |
| 69 | * 2008-11-16 work around a freebsd pthread bug. |
| 70 | * 2008-11-19 define coro_*jmp symbols for easier porting. |
| 71 | * 2009-06-23 tentative win32-backend support for mingw32 (Yasuhiro Matsumoto). |
| 72 | * 2010-12-03 tentative support for uclibc (which lacks all sorts of things). |
| 73 | * 2011-05-30 set initial callee-saved-registers to zero with CORO_ASM. |
| 74 | * use .cfi_undefined rip on linux-amd64 for better backtraces. |
| 75 | * 2011-06-08 maybe properly implement weird windows amd64 calling conventions. |
| 76 | * 2011-07-03 rely on __GCC_HAVE_DWARF2_CFI_ASM for cfi detection. |
| 77 | * 2011-08-08 cygwin trashes stacks, use pthreads with double stack on cygwin. |
| 78 | * 2012-12-04 reduce misprediction penalty for x86/amd64 assembly switcher. |
| 79 | * 2012-12-05 experimental fiber backend (allocates stack twice). |
| 80 | * 2012-12-07 API version 3 - add coro_stack_alloc/coro_stack_free. |
| 81 | * 2012-12-21 valgrind stack registering was broken. |
| 82 | * 2015-12-05 experimental asm be for arm7, based on a patch by Nick Zavaritsky. |
| 83 | * use __name__ for predefined symbols, as in libecb. |
| 84 | * enable guard pages on arm, aarch64 and mips. |
| 85 | */ |
| 86 | |
| 87 | #ifndef CORO_H |
| 88 | #define CORO_H |
| 89 | |
| 90 | #if __cplusplus |
| 91 | extern "C" { |
| 92 | #endif |
| 93 | |
| 94 | /* |
| 95 | * This library consists of only three files |
| 96 | * coro.h, coro.c and LICENSE (and optionally README) |
| 97 | * |
| 98 | * It implements what is known as coroutines, in a hopefully |
| 99 | * portable way. |
| 100 | * |
| 101 | * All compiletime symbols must be defined both when including coro.h |
| 102 | * (using libcoro) as well as when compiling coro.c (the implementation). |
| 103 | * |
| 104 | * You can manually specify which flavour you want. If you don't define |
| 105 | * any of these, libcoro tries to choose a safe and fast default: |
| 106 | * |
| 107 | * -DCORO_UCONTEXT |
| 108 | * |
| 109 | * This flavour uses SUSv2's get/set/swap/makecontext functions that |
| 110 | * unfortunately only some unices support, and is quite slow. |
| 111 | * |
| 112 | * -DCORO_SJLJ |
| 113 | * |
| 114 | * This flavour uses SUSv2's setjmp/longjmp and sigaltstack functions to |
| 115 | * do it's job. Coroutine creation is much slower than UCONTEXT, but |
| 116 | * context switching is a bit cheaper. It should work on almost all unices. |
| 117 | * |
| 118 | * -DCORO_LINUX |
| 119 | * |
| 120 | * CORO_SJLJ variant. |
| 121 | * Old GNU/Linux systems (<= glibc-2.1) only work with this implementation |
| 122 | * (it is very fast and therefore recommended over other methods, but |
| 123 | * doesn't work with anything newer). |
| 124 | * |
| 125 | * -DCORO_LOSER |
| 126 | * |
| 127 | * CORO_SJLJ variant. |
| 128 | * Microsoft's highly proprietary platform doesn't support sigaltstack, and |
| 129 | * this selects a suitable workaround for this platform. It might not work |
| 130 | * with your compiler though - it has only been tested with MSVC 6. |
| 131 | * |
| 132 | * -DCORO_FIBER |
| 133 | * |
| 134 | * Slower, but probably more portable variant for the Microsoft operating |
| 135 | * system, using fibers. Ignores the passed stack and allocates it internally. |
| 136 | * Also, due to bugs in cygwin, this does not work with cygwin. |
| 137 | * |
| 138 | * -DCORO_IRIX |
| 139 | * |
| 140 | * CORO_SJLJ variant. |
| 141 | * For SGI's version of Microsoft's NT ;) |
| 142 | * |
| 143 | * -DCORO_ASM |
| 144 | * |
| 145 | * Hand coded assembly, known to work only on a few architectures/ABI: |
| 146 | * GCC + arm7/x86/IA32/amd64/x86_64 + GNU/Linux and a few BSDs. Fastest |
| 147 | * choice, if it works. |
| 148 | * |
| 149 | * -DCORO_PTHREAD |
| 150 | * |
| 151 | * Use the pthread API. You have to provide <pthread.h> and -lpthread. |
| 152 | * This is likely the slowest backend, and it also does not support fork(), |
| 153 | * so avoid it at all costs. |
| 154 | * |
| 155 | * If you define neither of these symbols, coro.h will try to autodetect |
| 156 | * the best/safest model. To help with the autodetection, you should check |
| 157 | * (e.g. using autoconf) and define the following symbols: HAVE_UCONTEXT_H |
| 158 | * / HAVE_SETJMP_H / HAVE_SIGALTSTACK. |
| 159 | */ |
| 160 | |
| 161 | /* |
| 162 | * Changes when the API changes incompatibly. |
| 163 | * This is ONLY the API version - there is no ABI compatibility between releases. |
| 164 | * |
| 165 | * Changes in API version 2: |
| 166 | * replaced bogus -DCORO_LOOSE with grammatically more correct -DCORO_LOSER |
| 167 | * Changes in API version 3: |
| 168 | * introduced stack management (CORO_STACKALLOC) |
| 169 | */ |
| 170 | #define CORO_VERSION 3 |
| 171 | |
| 172 | #include <stddef.h> |
| 173 | |
| 174 | /* |
| 175 | * This is the type for the initialization function of a new coroutine. |
| 176 | */ |
| 177 | typedef void (*coro_func)(void *); |
| 178 | |
| 179 | /* |
| 180 | * A coroutine state is saved in the following structure. Treat it as an |
| 181 | * opaque type. errno and sigmask might be saved, but don't rely on it, |
| 182 | * implement your own switching primitive if you need that. |
| 183 | */ |
| 184 | typedef struct coro_context coro_context; |
| 185 | |
| 186 | /* |
| 187 | * This function creates a new coroutine. Apart from a pointer to an |
| 188 | * uninitialised coro_context, it expects a pointer to the entry function |
| 189 | * and the single pointer value that is given to it as argument. |
| 190 | * |
| 191 | * Allocating/deallocating the stack is your own responsibility. |
| 192 | * |
| 193 | * As a special case, if coro, arg, sptr and ssze are all zero, |
| 194 | * then an "empty" coro_context will be created that is suitable |
| 195 | * as an initial source for coro_transfer. |
| 196 | * |
| 197 | * This function is not reentrant, but putting a mutex around it |
| 198 | * will work. |
| 199 | */ |
| 200 | void coro_create (coro_context *ctx, /* an uninitialised coro_context */ |
| 201 | coro_func coro, /* the coroutine code to be executed */ |
| 202 | void *arg, /* a single pointer passed to the coro */ |
| 203 | void *sptr, /* start of stack area */ |
| 204 | size_t ssze); /* size of stack area in bytes */ |
| 205 | |
| 206 | /* |
| 207 | * The following prototype defines the coroutine switching function. It is |
| 208 | * sometimes implemented as a macro, so watch out. |
| 209 | * |
| 210 | * This function is thread-safe and reentrant. |
| 211 | */ |
| 212 | #if 0 |
| 213 | void coro_transfer (coro_context *prev, coro_context *next); |
| 214 | #endif |
| 215 | |
| 216 | /* |
| 217 | * The following prototype defines the coroutine destroy function. It |
| 218 | * is sometimes implemented as a macro, so watch out. It also serves no |
| 219 | * purpose unless you want to use the CORO_PTHREAD backend, where it is |
| 220 | * used to clean up the thread. You are responsible for freeing the stack |
| 221 | * and the context itself. |
| 222 | * |
| 223 | * This function is thread-safe and reentrant. |
| 224 | */ |
| 225 | #if 0 |
| 226 | void coro_destroy (coro_context *ctx); |
| 227 | #endif |
| 228 | |
| 229 | /*****************************************************************************/ |
| 230 | /* optional stack management */ |
| 231 | /*****************************************************************************/ |
| 232 | /* |
| 233 | * You can disable all of the stack management functions by |
| 234 | * defining CORO_STACKALLOC to 0. Otherwise, they are enabled by default. |
| 235 | * |
| 236 | * If stack management is enabled, you can influence the implementation via these |
| 237 | * symbols: |
| 238 | * |
| 239 | * -DCORO_USE_VALGRIND |
| 240 | * |
| 241 | * If defined, then libcoro will include valgrind/valgrind.h and register |
| 242 | * and unregister stacks with valgrind. |
| 243 | * |
| 244 | * -DCORO_GUARDPAGES=n |
| 245 | * |
| 246 | * libcoro will try to use the specified number of guard pages to protect against |
| 247 | * stack overflow. If n is 0, then the feature will be disabled. If it isn't |
| 248 | * defined, then libcoro will choose a suitable default. If guardpages are not |
| 249 | * supported on the platform, then the feature will be silently disabled. |
| 250 | */ |
| 251 | #ifndef CORO_STACKALLOC |
| 252 | # define CORO_STACKALLOC 1 |
| 253 | #endif |
| 254 | |
| 255 | #if CORO_STACKALLOC |
| 256 | |
| 257 | /* |
| 258 | * The only allowed operations on these struct members is to read the |
| 259 | * "sptr" and "ssze" members to pass it to coro_create, to read the "sptr" |
| 260 | * member to see if it is false, in which case the stack isn't allocated, |
| 261 | * and to set the "sptr" member to 0, to indicate to coro_stack_free to |
| 262 | * not actually do anything. |
| 263 | */ |
| 264 | |
| 265 | struct coro_stack |
| 266 | { |
| 267 | void *sptr; |
| 268 | size_t ssze; |
| 269 | #if CORO_USE_VALGRIND |
| 270 | int valgrind_id; |
| 271 | #endif |
| 272 | }; |
| 273 | |
| 274 | /* |
| 275 | * Try to allocate a stack of at least the given size and return true if |
| 276 | * successful, or false otherwise. |
| 277 | * |
| 278 | * The size is *NOT* specified in bytes, but in units of sizeof (void *), |
| 279 | * i.e. the stack is typically 4(8) times larger on 32 bit(64 bit) platforms |
| 280 | * then the size passed in. |
| 281 | * |
| 282 | * If size is 0, then a "suitable" stack size is chosen (usually 1-2MB). |
| 283 | */ |
| 284 | int coro_stack_alloc (struct coro_stack *stack, unsigned int size); |
| 285 | |
| 286 | /* |
| 287 | * Free the stack allocated by coro_stack_alloc again. It is safe to |
| 288 | * call this function on the coro_stack structure even if coro_stack_alloc |
| 289 | * failed. |
| 290 | */ |
| 291 | void coro_stack_free (struct coro_stack *stack); |
| 292 | |
| 293 | #endif |
| 294 | |
| 295 | /* |
| 296 | * That was it. No other user-serviceable parts below here. |
| 297 | */ |
| 298 | |
| 299 | /*****************************************************************************/ |
| 300 | |
| 301 | #if !defined CORO_LOSER && !defined CORO_UCONTEXT \ |
| 302 | && !defined CORO_SJLJ && !defined CORO_LINUX \ |
| 303 | && !defined CORO_IRIX && !defined CORO_ASM \ |
| 304 | && !defined CORO_PTHREAD && !defined CORO_FIBER |
| 305 | # if defined WINDOWS && (defined __i386__ || (__x86_64__ || defined _M_IX86 || defined _M_AMD64)) |
| 306 | # define CORO_ASM 1 |
| 307 | # elif defined WINDOWS || defined _WIN32 |
| 308 | # define CORO_LOSER 1 /* you don't win with windoze */ |
| 309 | # elif __linux && (__i386__ || (__x86_64__ && !__ILP32__) || (__arm__ && __ARCH_ARCH == 7)) |
| 310 | # define CORO_ASM 1 |
| 311 | # elif defined HAVE_UCONTEXT_H |
| 312 | # define CORO_UCONTEXT 1 |
| 313 | # elif defined HAVE_SETJMP_H && defined HAVE_SIGALTSTACK |
| 314 | # define CORO_SJLJ 1 |
| 315 | # else |
| 316 | error unknown or unsupported architecture |
| 317 | # endif |
| 318 | #endif |
| 319 | |
| 320 | /*****************************************************************************/ |
| 321 | |
| 322 | #if CORO_UCONTEXT |
| 323 | |
| 324 | # include <ucontext.h> |
| 325 | |
| 326 | struct coro_context |
| 327 | { |
| 328 | ucontext_t uc; |
| 329 | }; |
| 330 | |
| 331 | # define coro_transfer(p,n) swapcontext (&((p)->uc), &((n)->uc)) |
| 332 | # define coro_destroy(ctx) (void *)(ctx) |
| 333 | |
| 334 | #elif CORO_SJLJ || CORO_LOSER || CORO_LINUX || CORO_IRIX |
| 335 | |
| 336 | # if defined(CORO_LINUX) && !defined(_GNU_SOURCE) |
| 337 | # define _GNU_SOURCE /* for glibc */ |
| 338 | # endif |
| 339 | |
| 340 | # if !CORO_LOSER |
| 341 | # include <unistd.h> |
| 342 | # endif |
| 343 | |
| 344 | /* solaris is hopelessly borked, it expands _XOPEN_UNIX to nothing */ |
| 345 | # if __sun |
| 346 | # undef _XOPEN_UNIX |
| 347 | # define _XOPEN_UNIX 1 |
| 348 | # endif |
| 349 | |
| 350 | # include <setjmp.h> |
| 351 | |
| 352 | # if _XOPEN_UNIX > 0 || defined (_setjmp) |
| 353 | # define coro_jmp_buf jmp_buf |
| 354 | # define coro_setjmp(env) _setjmp (env) |
| 355 | # define coro_longjmp(env) _longjmp ((env), 1) |
| 356 | # elif CORO_LOSER |
| 357 | # define coro_jmp_buf jmp_buf |
| 358 | # define coro_setjmp(env) setjmp (env) |
| 359 | # define coro_longjmp(env) longjmp ((env), 1) |
| 360 | # else |
| 361 | # define coro_jmp_buf sigjmp_buf |
| 362 | # define coro_setjmp(env) sigsetjmp (env, 0) |
| 363 | # define coro_longjmp(env) siglongjmp ((env), 1) |
| 364 | # endif |
| 365 | |
| 366 | struct coro_context |
| 367 | { |
| 368 | coro_jmp_buf env; |
| 369 | }; |
| 370 | |
| 371 | # define coro_transfer(p,n) do { if (!coro_setjmp ((p)->env)) coro_longjmp ((n)->env); } while (0) |
| 372 | # define coro_destroy(ctx) (void *)(ctx) |
| 373 | |
| 374 | #elif CORO_ASM |
| 375 | |
| 376 | struct coro_context |
| 377 | { |
| 378 | void **sp; /* must be at offset 0 */ |
| 379 | }; |
| 380 | |
| 381 | #if __i386__ || __x86_64__ |
| 382 | void __attribute__ ((__noinline__, __regparm__(2))) |
| 383 | #else |
| 384 | void __attribute__ ((__noinline__)) |
| 385 | #endif |
| 386 | coro_transfer (coro_context *prev, coro_context *next); |
| 387 | |
| 388 | # define coro_destroy(ctx) (void *)(ctx) |
| 389 | |
| 390 | #elif CORO_PTHREAD |
| 391 | |
| 392 | # include <pthread.h> |
| 393 | |
| 394 | extern pthread_mutex_t coro_mutex; |
| 395 | |
| 396 | struct coro_context |
| 397 | { |
| 398 | pthread_cond_t cv; |
| 399 | pthread_t id; |
| 400 | }; |
| 401 | |
| 402 | void coro_transfer (coro_context *prev, coro_context *next); |
| 403 | void coro_destroy (coro_context *ctx); |
| 404 | |
| 405 | #elif CORO_FIBER |
| 406 | |
| 407 | struct coro_context |
| 408 | { |
| 409 | void *fiber; |
| 410 | /* only used for initialisation */ |
| 411 | coro_func coro; |
| 412 | void *arg; |
| 413 | }; |
| 414 | |
| 415 | void coro_transfer (coro_context *prev, coro_context *next); |
| 416 | void coro_destroy (coro_context *ctx); |
| 417 | |
| 418 | #endif |
| 419 | |
| 420 | #if __cplusplus |
| 421 | } |
| 422 | #endif |
| 423 | |
| 424 | #endif |
| 425 | |
| 426 | |