mirror of
https://github.com/logos-messaging/nim-ffi.git
synced 2026-06-21 08:49:34 +00:00
190 lines
7.1 KiB
Nim
190 lines
7.1 KiB
Nim
## FFIContext type plus lifecycle (init / signal-stop / join / destroy).
|
|
##
|
|
## The per-thread bodies live in `ffi_thread.nim` and `event_thread.nim`,
|
|
## included below so the thread code can access the private FFIContext
|
|
## fields without forcing them through a public surface.
|
|
|
|
{.passc: "-fPIC".}
|
|
|
|
import std/[atomics, locks, options, tables]
|
|
import chronicles, chronos, chronos/threadsync, taskpools/channels_spsc_single, results
|
|
import ./ffi_types, ./ffi_events, ./ffi_thread_request, ./logging, ./cbor_serial
|
|
|
|
export ffi_events
|
|
|
|
type FFIContext*[T] = object
|
|
myLib*: ptr T # main library object (Waku, LibP2P, SDS, …)
|
|
ffiThread: Thread[(ptr FFIContext[T])]
|
|
eventThread: Thread[(ptr FFIContext[T])]
|
|
lock: Lock
|
|
reqChannel: ChannelSPSCSingle[ptr FFIThreadRequest]
|
|
reqSignal: ThreadSignalPtr
|
|
reqReceivedSignal: ThreadSignalPtr
|
|
stopSignal: ThreadSignalPtr
|
|
threadExitSignal: ThreadSignalPtr
|
|
# bounds destroyFFIContext's wait so a blocked loop cannot hang the caller
|
|
eventQueueSignal: ThreadSignalPtr # wakes the event thread on enqueue
|
|
eventThreadExitSignal: ThreadSignalPtr # mirrors threadExitSignal for the event thread
|
|
userData*: pointer
|
|
eventRegistry*: FFIEventRegistry
|
|
eventQueue*: EventQueue
|
|
ffiHeartbeat*: Atomic[int64]
|
|
# advanced each FFI-thread loop; event thread reads for liveness
|
|
eventQueueStuck*: Atomic[bool] # sticky overflow flag
|
|
running: Atomic[bool] # To control when the threads are running
|
|
registeredRequests: ptr Table[cstring, FFIRequestProc]
|
|
|
|
var onFFIThread* {.threadvar.}: bool
|
|
# Re-entrant dispatch guard for `sendRequestToFFIThread`.
|
|
|
|
const git_version* {.strdefine.} = "n/a"
|
|
|
|
const
|
|
EventThreadTickInterval* = 1.seconds
|
|
FFIHeartbeatStartDelay* = 10.seconds # grace window for library startup
|
|
FFIHeartbeatStaleThreshold* = 1.seconds
|
|
|
|
include ./event_thread
|
|
include ./ffi_thread
|
|
|
|
template closeAndNil(field: untyped) =
|
|
if not field.isNil():
|
|
?field.close()
|
|
field = nil
|
|
|
|
proc deinitContextResources*[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
## Mirror of `initContextResources`. Threads MUST be joined first;
|
|
## fields are nil'd after close so re-init on the same slot is safe.
|
|
ctx.lock.deinitLock()
|
|
deinitEventRegistry(ctx[].eventRegistry)
|
|
deinitEventQueue(ctx[].eventQueue)
|
|
when defined(gcRefc):
|
|
# ThreadSignalPtr.close() under refc traps in safeUnregisterAndCloseFd
|
|
# → newDispatcher → rawNewObj → signal-handler re-entry (process hangs).
|
|
# See tests/test_ffi_context.nim "destroyFFIContext refc workaround".
|
|
# Fd leak is bounded — destroy runs once per process lifetime.
|
|
discard
|
|
else:
|
|
closeAndNil(ctx.reqSignal)
|
|
closeAndNil(ctx.reqReceivedSignal)
|
|
closeAndNil(ctx.stopSignal)
|
|
closeAndNil(ctx.threadExitSignal)
|
|
closeAndNil(ctx.eventQueueSignal)
|
|
closeAndNil(ctx.eventThreadExitSignal)
|
|
ok()
|
|
|
|
proc cleanUpResources[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
## Deinit + free for heap-allocated contexts.
|
|
defer:
|
|
freeShared(ctx)
|
|
ctx.deinitContextResources()
|
|
|
|
template newSignalOrErr(field: untyped, name: string) =
|
|
field = ThreadSignalPtr.new().valueOr:
|
|
return err("couldn't create ThreadSignalPtr: " & name & ": " & $error)
|
|
|
|
proc initContextResources*[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
## On failure, the deferred cleanup closes partial state; caller releases
|
|
## the slot (freeShared or pool.releaseSlot).
|
|
# Nil first so deferred cleanup can't double-close a reused pool slot.
|
|
ctx.reqSignal = nil
|
|
ctx.reqReceivedSignal = nil
|
|
ctx.stopSignal = nil
|
|
ctx.threadExitSignal = nil
|
|
ctx.eventQueueSignal = nil
|
|
ctx.eventThreadExitSignal = nil
|
|
ctx.lock.initLock()
|
|
initEventRegistry(ctx[].eventRegistry)
|
|
initEventQueue(ctx[].eventQueue)
|
|
ctx.ffiHeartbeat.store(0)
|
|
ctx.eventQueueStuck.store(false)
|
|
|
|
var success = false
|
|
defer:
|
|
if not success:
|
|
ctx.cleanUpResources().isOkOr:
|
|
error "failed to clean up resources after createFFIContext failure",
|
|
error = error
|
|
|
|
newSignalOrErr(ctx.reqSignal, "reqSignal")
|
|
newSignalOrErr(ctx.reqReceivedSignal, "reqReceivedSignal")
|
|
newSignalOrErr(ctx.stopSignal, "stopSignal")
|
|
newSignalOrErr(ctx.threadExitSignal, "threadExitSignal")
|
|
newSignalOrErr(ctx.eventQueueSignal, "eventQueueSignal")
|
|
newSignalOrErr(ctx.eventThreadExitSignal, "eventThreadExitSignal")
|
|
|
|
ctx.registeredRequests = addr ffi_types.registeredRequests
|
|
|
|
ctx.running.store(true)
|
|
|
|
try:
|
|
createThread(ctx.ffiThread, ffiThreadBody[T], ctx)
|
|
except ValueError, ResourceExhaustedError:
|
|
return err("failed to create the FFI thread: " & getCurrentExceptionMsg())
|
|
|
|
try:
|
|
createThread(ctx.eventThread, eventThreadBody[T], ctx)
|
|
except ValueError, ResourceExhaustedError:
|
|
# Join ffiThread before deferred cleanup closes signals it's waiting on.
|
|
ctx.running.store(false)
|
|
let fireRes = ctx.reqSignal.fireSync()
|
|
if fireRes.isErr():
|
|
error "failed to signal ffiThread during event-thread cleanup",
|
|
error = fireRes.error
|
|
joinThread(ctx.ffiThread)
|
|
return err("failed to create the event thread: " & getCurrentExceptionMsg())
|
|
|
|
success = true
|
|
ok()
|
|
|
|
proc fireOrErr(sig: ThreadSignalPtr, name: string): Result[void, string] =
|
|
let fired = sig.fireSync().valueOr:
|
|
return err("error signaling: " & name & ": " & $error)
|
|
if not fired:
|
|
return err("failed to signal: " & name & " on time")
|
|
ok()
|
|
|
|
proc waitExitOrErr(
|
|
sig: ThreadSignalPtr, name: string, timeout: Duration
|
|
): Result[void, string] =
|
|
let exited = sig.waitSync(timeout).valueOr:
|
|
return err("error waiting for exit: " & name & ": " & $error)
|
|
if not exited:
|
|
return err("did not exit in time: " & name & " (leaking ctx to avoid hang)")
|
|
ok()
|
|
|
|
proc signalStop*[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
# Skip onNotResponding on error: it takes reg.lock, which a back-pressuring
|
|
# listener may hold — would deepen the stuck state into a deadlock.
|
|
ctx.running.store(false)
|
|
?ctx.reqSignal.fireOrErr("reqSignal")
|
|
?ctx.stopSignal.fireOrErr("stopSignal")
|
|
# Non-fatal: event thread sees running==false on the next tick anyway.
|
|
ctx.eventQueueSignal.fireOrErr("eventQueueSignal").isOkOr:
|
|
error "failed to signal eventQueueSignal in signalStop", error = error
|
|
ok()
|
|
|
|
## Bound on how long clearContext waits for the FFI thread to exit before
|
|
## leaking ctx rather than hanging the caller.
|
|
const ThreadExitTimeout* = 1500.milliseconds
|
|
|
|
proc stopAndJoinThreads*[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
## On timeout, returns err and skips remaining joins (leaves threads live).
|
|
## Caller owns resource cleanup. Skips onNotResponding (same reason as signalStop).
|
|
ctx.signalStop().isOkOr:
|
|
return err("signalStop failed: " & $error)
|
|
|
|
?ctx.threadExitSignal.waitExitOrErr("FFI thread", ThreadExitTimeout)
|
|
joinThread(ctx.ffiThread)
|
|
?ctx.eventThreadExitSignal.waitExitOrErr("event thread", ThreadExitTimeout)
|
|
joinThread(ctx.eventThread)
|
|
ok()
|
|
|
|
proc clearContext[T](ctx: ptr FFIContext[T]): Result[void, string] =
|
|
## Stops a heap-allocated FFI context.
|
|
ctx.stopAndJoinThreads().isOkOr:
|
|
return err("clearContext: " & $error)
|
|
ctx.cleanUpResources().isOkOr:
|
|
return err("cleanUpResources failed: " & $error)
|
|
ok()
|