Add `.trionics._broadcast` todos for py 3.12

Start a `._rpc` module
Since `._runtime` was getting pretty long (> 2k LOC) and much of the RPC low-level machinery is fairly isolated to a handful of task-funcs, it makes sense to re-org the RPC task scheduling and driving msg loop to its own code space. The move includes: - `process_messages()` which is the main IPC business logic. - `try_ship_error_to_remote()` helper, to box local errors for the wire. - `_invoke()`, the core task scheduler entrypoint used in the msg loop. - `_invoke_non_context()`, holds impls for non-`@context` task starts. - `_errors_relayed_via_ipc()` which does all error catch-n-boxing for wire-msg shipment using `try_ship_error_to_remote()` internally. Also inside `._runtime` improve some `Actor` method docs.
2024-03-13 16:09:31 -04:00 · 2024-03-13 15:57:15 -04:00 · 2024-03-13 12:09:38 -04:00 · 2024-03-13 10:44:51 -04:00 · 2024-03-13 09:09:08 -04:00 · 2024-03-12 08:56:17 -04:00
27 changed files with 1257 additions and 332 deletions
--- a/examples/advanced_faults/ipc_failure_during_stream.py
+++ b/examples/advanced_faults/ipc_failure_during_stream.py
@ -6,7 +6,6 @@ been an outage) and we want to ensure that despite being in debug mode
 actor tree will eventually be cancelled without leaving any zombies.
 '''
 from contextlib import asynccontextmanager as acm
 from functools import partial
 from tractor import (
@ -18,7 +17,6 @@ from tractor import (
    _testing,
 )
 import trio
 import pytest
 async def break_ipc(
@ -43,13 +41,6 @@ async def break_ipc(
        await stream.aclose()
    method: str = method or def_method
    print(
        '#################################\n'
        'Simulating CHILD-side IPC BREAK!\n'
        f'method: {method}\n'
        f'pre `.aclose()`: {pre_close}\n'
        '#################################\n'
    )
    match method:
        case 'trans_aclose':
@ -89,17 +80,17 @@ async def break_ipc_then_error(
    break_ipc_with: str|None = None,
    pre_close: bool = False,
 ):
    await break_ipc(
        stream=stream,
        method=break_ipc_with,
        pre_close=pre_close,
    )
    async for msg in stream:
        await stream.send(msg)
-
+        await break_ipc(
-    assert 0
+            stream=stream,
            method=break_ipc_with,
            pre_close=pre_close,
        )
        assert 0
 # async def close_stream_and_error(
 async def iter_ipc_stream(
    stream: MsgStream,
    break_ipc_with: str|None = None,
@ -108,6 +99,20 @@ async def iter_ipc_stream(
    async for msg in stream:
        await stream.send(msg)
        # wipe out channel right before raising
        # await break_ipc(
        #     stream=stream,
        #     method=break_ipc_with,
        #     pre_close=pre_close,
        # )
        # send channel close msg at SC-prot level
        #
        # TODO: what should get raised here if anything?
        # await stream.aclose()
    # assert 0
@context
 async def recv_and_spawn_net_killers(
@ -129,16 +134,14 @@ async def recv_and_spawn_net_killers(
        async for i in stream:
            print(f'child echoing {i}')
            await stream.send(i)
            if (
                break_ipc_after
                and
-                i >= break_ipc_after
+                i > break_ipc_after
            ):
-                n.start_soon(
+                '#################################\n'
-                    iter_ipc_stream,
+                'Simulating CHILD-side IPC BREAK!\n'
-                    stream,
+                '#################################\n'
                )
                n.start_soon(
                    partial(
                        break_ipc_then_error,
@ -146,23 +149,10 @@ async def recv_and_spawn_net_killers(
                        pre_close=pre_close,
                    )
                )
-
+                n.start_soon(
-
+                    iter_ipc_stream,
-@acm
+                    stream,
-async def stuff_hangin_ctlc(timeout: float = 1) -> None:
+                )
    with trio.move_on_after(timeout) as cs:
        yield timeout
    if cs.cancelled_caught:
        # pretend to be a user seeing no streaming action
        # thinking it's a hang, and then hitting ctl-c..
        print(
            f"i'm a user on the PARENT side and thingz hangin "
            f'after timeout={timeout} ???\n\n'
            'MASHING CTlR-C..!?\n'
        )
        raise KeyboardInterrupt
 async def main(
@ -179,6 +169,9 @@ async def main(
 ) -> None:
    # from tractor._state import _runtime_vars as rtv
    # rtv['_debug_mode'] = debug_mode
    async with (
        open_nursery(
            start_method=start_method,
@ -197,11 +190,10 @@ async def main(
        )
        async with (
            stuff_hangin_ctlc(timeout=2) as timeout,
            _testing.expect_ctxc(
                yay=(
                    break_parent_ipc_after
-                    or break_child_ipc_after
+                    or break_child_ipc_after,
                ),
                # TODO: we CAN'T remove this right?
                # since we need the ctxc to bubble up from either
@ -213,14 +205,12 @@ async def main(
                # and KBI in an eg?
                reraise=True,
            ),
            portal.open_context(
                recv_and_spawn_net_killers,
                break_ipc_after=break_child_ipc_after,
                pre_close=pre_close,
            ) as (ctx, sent),
        ):
            rx_eoc: bool = False
            ipc_break_sent: bool = False
            async with ctx.open_stream() as stream:
                for i in range(1000):
@ -238,7 +228,6 @@ async def main(
                            '#################################\n'
                        )
                        # TODO: other methods? see break func above.
                        # await stream._ctx.chan.send(None)
                        # await stream._ctx.chan.transport.stream.send_eof()
                        await stream._ctx.chan.transport.stream.aclose()
@ -262,12 +251,10 @@ async def main(
                        # TODO: is this needed or no?
                        raise
-                    # timeout: int = 1
+                    timeout: int = 1
-                    # with trio.move_on_after(timeout) as cs:
+                    print(f'Entering `stream.receive()` with timeout={timeout}\n')
-                    async with stuff_hangin_ctlc() as timeout:
+                    with trio.move_on_after(timeout) as cs:
-                        print(
+
                            f'PARENT `stream.receive()` with timeout={timeout}\n'
                        )
                        # NOTE: in the parent side IPC failure case this
                        # will raise an ``EndOfChannel`` after the child
                        # is killed and sends a stop msg back to it's
@ -279,30 +266,23 @@ async def main(
                                f'{rx}\n'
                            )
                        except trio.EndOfChannel:
                            rx_eoc: bool = True
                            print('MsgStream got EoC for PARENT')
                            raise
-            print(
+                    if cs.cancelled_caught:
-                'Streaming finished and we got Eoc.\n'
+                        # pretend to be a user seeing no streaming action
-                'Canceling `.open_context()` in root with\n'
+                        # thinking it's a hang, and then hitting ctl-c..
-                'CTlR-C..'
+                        print(
-            )
+                            f"YOO i'm a PARENT user anddd thingz hangin..\n"
-            if rx_eoc:
+                            f'after timeout={timeout}\n'
-                assert stream.closed
+                        )
                try:
                    await stream.send(i)
                    pytest.fail('stream not closed?')
                except (
                    trio.ClosedResourceError,
                    trio.EndOfChannel,
                ) as send_err:
                    if rx_eoc:
                        assert send_err is stream._eoc
                    else:
                        assert send_err is stream._closed
-            raise KeyboardInterrupt
+                print(
                    "YOO i'm mad!\n"
                    'The send side is dun but thingz hangin..\n'
                    'MASHING CTlR-C Ctl-c..'
                )
                raise KeyboardInterrupt
 if __name__ == '__main__':
--- a/examples/debugging/debug_mode_hang.py
+++ b/examples/debugging/debug_mode_hang.py
@ -1,9 +0,0 @@
 '''
 Reproduce a bug where enabling debug mode for a sub-actor actually causes
 a hang on teardown...
 '''
 import asyncio
 import trio
 import tractor
--- a/examples/parallelism/concurrent_actors_primes.py
+++ b/examples/parallelism/concurrent_actors_primes.py
@ -8,10 +8,7 @@ This uses no extra threads, fancy semaphores or futures; all we need
 is ``tractor``'s channels.
 """
-from contextlib import (
+from contextlib import asynccontextmanager
    asynccontextmanager as acm,
    aclosing,
 )
 from typing import Callable
 import itertools
 import math
@ -19,6 +16,7 @@ import time
 import tractor
 import trio
 from async_generator import aclosing
 PRIMES = [
@ -46,7 +44,7 @@ async def is_prime(n):
    return True
-@acm
+@asynccontextmanager
 async def worker_pool(workers=4):
    """Though it's a trivial special case for ``tractor``, the well
    known "worker pool" seems to be the defacto "but, I want this
--- a/examples/rpc_bidir_streaming.py
+++ b/examples/rpc_bidir_streaming.py
@ -13,7 +13,7 @@ async def simple_rpc(
    '''
    # signal to parent that we're up much like
-    # ``trio.TaskStatus.started()``
+    # ``trio_typing.TaskStatus.started()``
    await ctx.started(data + 1)
    async with ctx.open_stream() as stream:
--- a/pytest.ini
+++ b/pytest.ini
@ -1,8 +0,0 @@
 # vim: ft=ini
 # pytest.ini for tractor
 [pytest]
 # don't show frickin captured logs AGAIN in the report..
 addopts = --show-capture='no'
 log_cli = false
 ; minversion = 6.0
--- a/requirements-test.txt
+++ b/requirements-test.txt
@ -6,3 +6,4 @@ mypy
 trio_typing
 pexpect
 towncrier
 numpy
--- a/setup.py
+++ b/setup.py
@ -46,11 +46,10 @@ setup(
        # trio related
        # proper range spec:
        # https://packaging.python.org/en/latest/discussions/install-requires-vs-requirements/#id5
-        'trio >= 0.24',
+        'trio >= 0.22',
-
+        'async_generator',
-        # 'async_generator',  # in stdlib mostly!
+        'trio_typing',
-        # 'trio_typing',  # trio==0.23.0 has type hints!
+        'exceptiongroup',
        # 'exceptiongroup',  # in stdlib as of 3.11!
        # tooling
        'stackscope',
--- a/tests/conftest.py
+++ b/tests/conftest.py
@ -41,22 +41,43 @@ no_windows = pytest.mark.skipif(
 def pytest_addoption(parser):
    parser.addoption(
-        "--ll", action="store", dest='loglevel',
+        "--ll",
        action="store",
        dest='loglevel',
        default='ERROR', help="logging level to set when testing"
    )
    parser.addoption(
-        "--spawn-backend", action="store", dest='spawn_backend',
+        "--spawn-backend",
        action="store",
        dest='spawn_backend',
        default='trio',
        help="Processing spawning backend to use for test run",
    )
    parser.addoption(
        "--tpdb", "--debug-mode",
        action="store_true",
        dest='tractor_debug_mode',
        # default=False,
        help=(
            'Enable a flag that can be used by tests to to set the '
            '`debug_mode: bool` for engaging the internal '
            'multi-proc debugger sys.'
        ),
    )
 def pytest_configure(config):
    backend = config.option.spawn_backend
    tractor._spawn.try_set_start_method(backend)
@pytest.fixture(scope='session')
 def debug_mode(request):
    return request.config.option.tractor_debug_mode
@pytest.fixture(scope='session', autouse=True)
 def loglevel(request):
    orig = tractor.log._default_loglevel
--- a/tests/test_advanced_faults.py
+++ b/tests/test_advanced_faults.py
@ -85,8 +85,8 @@ def test_ipc_channel_break_during_stream(
    '''
    if spawn_backend != 'trio':
-        if debug_mode:
+    #     if debug_mode:
-            pytest.skip('`debug_mode` only supported on `trio` spawner')
+    #         pytest.skip('`debug_mode` only supported on `trio` spawner')
        # non-`trio` spawners should never hit the hang condition that
        # requires the user to do ctl-c to cancel the actor tree.
@ -107,10 +107,7 @@ def test_ipc_channel_break_during_stream(
        # AND we tell the child to call `MsgStream.aclose()`.
        and pre_aclose_msgstream
    ):
-        # expect_final_exc = trio.EndOfChannel
+        expect_final_exc = trio.EndOfChannel
        # ^XXX NOPE! XXX^ since now `.open_stream()` absorbs this
        # gracefully!
        expect_final_exc = KeyboardInterrupt
    # NOTE when ONLY the child breaks or it breaks BEFORE the
    # parent we expect the parent to get a closed resource error
@ -123,25 +120,11 @@ def test_ipc_channel_break_during_stream(
        and
        ipc_break['break_parent_ipc_after'] is False
    ):
-        # NOTE: we DO NOT expect this any more since
+        expect_final_exc = trio.ClosedResourceError
        # the child side's channel will be broken silently
        # and nothing on the parent side will indicate this!
        # expect_final_exc = trio.ClosedResourceError
-        # NOTE: child will send a 'stop' msg before it breaks
+        # if child calls `MsgStream.aclose()` then expect EoC.
        # the transport channel BUT, that will be absorbed by the
        # `ctx.open_stream()` block and thus the `.open_context()`
        # should hang, after which the test script simulates
        # a user sending ctl-c by raising a KBI.
        if pre_aclose_msgstream:
-            expect_final_exc = KeyboardInterrupt
+            expect_final_exc = trio.EndOfChannel
            # XXX OLD XXX
            # if child calls `MsgStream.aclose()` then expect EoC.
            # ^ XXX not any more ^ since eoc is always absorbed
            # gracefully and NOT bubbled to the `.open_context()`
            # block!
            # expect_final_exc = trio.EndOfChannel
    # BOTH but, CHILD breaks FIRST
    elif (
@ -151,8 +134,12 @@ def test_ipc_channel_break_during_stream(
            > ipc_break['break_child_ipc_after']
        )
    ):
        expect_final_exc = trio.ClosedResourceError
        # child will send a 'stop' msg before it breaks
        # the transport channel.
        if pre_aclose_msgstream:
-            expect_final_exc = KeyboardInterrupt
+            expect_final_exc = trio.EndOfChannel
    # NOTE when the parent IPC side dies (even if the child's does as well
    # but the child fails BEFORE the parent) we always expect the
@ -173,8 +160,7 @@ def test_ipc_channel_break_during_stream(
        ipc_break['break_parent_ipc_after'] is not False
        and (
            ipc_break['break_child_ipc_after']
-            >
+            > ipc_break['break_parent_ipc_after']
            ipc_break['break_parent_ipc_after']
        )
    ):
        expect_final_exc = trio.ClosedResourceError
@ -238,29 +224,25 @@ def test_stream_closed_right_after_ipc_break_and_zombie_lord_engages():
    '''
    async def main():
-        with trio.fail_after(3):
+        async with tractor.open_nursery() as n:
-            async with tractor.open_nursery() as n:
+            portal = await n.start_actor(
-                portal = await n.start_actor(
+                'ipc_breaker',
-                    'ipc_breaker',
+                enable_modules=[__name__],
-                    enable_modules=[__name__],
+            )
                )
-                with trio.move_on_after(1):
+            with trio.move_on_after(1):
-                    async with (
+                async with (
-                        portal.open_context(
+                    portal.open_context(
-                            break_ipc_after_started
+                        break_ipc_after_started
-                        ) as (ctx, sent),
+                    ) as (ctx, sent),
-                    ):
+                ):
-                        async with ctx.open_stream():
+                    async with ctx.open_stream():
-                            await trio.sleep(0.5)
+                        await trio.sleep(0.5)
-                        print('parent waiting on context')
+                    print('parent waiting on context')
-                print(
+            print('parent exited context')
-                    'parent exited context\n'
+            raise KeyboardInterrupt
                    'parent raising KBI..\n'
                )
                raise KeyboardInterrupt
    with pytest.raises(KeyboardInterrupt):
        trio.run(main)
--- a/tests/test_cancellation.py
+++ b/tests/test_cancellation.py
@ -8,6 +8,10 @@ import platform
 import time
 from itertools import repeat
 from exceptiongroup import (
    BaseExceptionGroup,
    ExceptionGroup,
 )
 import pytest
 import trio
 import tractor
--- a/tests/test_child_manages_service_nursery.py
+++ b/tests/test_child_manages_service_nursery.py
@ -6,15 +6,13 @@ sub-sub-actor daemons.
 '''
 from typing import Optional
 import asyncio
-from contextlib import (
+from contextlib import asynccontextmanager as acm
    asynccontextmanager as acm,
    aclosing,
 )
 import pytest
 import trio
 import tractor
 from tractor import RemoteActorError
 from async_generator import aclosing
 async def aio_streamer(
--- a/tests/test_debugger.py
+++ b/tests/test_debugger.py
@ -12,9 +12,11 @@ TODO:
 """
 from functools import partial
 import itertools
 # from os import path
 from typing import Optional
 import platform
 import pathlib
 # import sys
 import time
 import pytest
@ -24,13 +26,13 @@ from pexpect.exceptions import (
    EOF,
 )
 from tractor._testing import (
    examples_dir,
 )
 from tractor.devx._debug import (
    _pause_msg,
    _crash_msg,
 )
 from tractor._testing import (
    examples_dir,
 )
 from conftest import (
    _ci_env,
 )
--- a/tests/test_infected_asyncio.py
+++ b/tests/test_infected_asyncio.py
@ -8,6 +8,7 @@ import builtins
 import itertools
 import importlib
 from exceptiongroup import BaseExceptionGroup
 import pytest
 import trio
 import tractor
@ -19,8 +20,6 @@ from tractor import (
 from tractor.trionics import BroadcastReceiver
 from tractor._testing import expect_ctxc
 from conftest import expect_ctxc
 async def sleep_and_err(
    sleep_for: float = 0.1,
--- a/tests/test_runtime.py
+++ b/tests/test_runtime.py
@ -64,8 +64,7 @@ async def test_lifetime_stack_wipes_tmpfile(
    except (
        tractor.RemoteActorError,
-        # tractor.BaseExceptionGroup,
+        tractor.BaseExceptionGroup,
        BaseExceptionGroup,
    ):
        pass
--- a/tests/test_shm.py
+++ b/tests/test_shm.py
@ -0,0 +1,167 @@
 """
 Shared mem primitives and APIs.
 """
 import uuid
 # import numpy
 import pytest
 import trio
 import tractor
 from tractor._shm import (
    open_shm_list,
    attach_shm_list,
 )
@tractor.context
 async def child_attach_shml_alot(
    ctx: tractor.Context,
    shm_key: str,
 ) -> None:
    await ctx.started(shm_key)
    # now try to attach a boatload of times in a loop..
    for _ in range(1000):
        shml = attach_shm_list(
            key=shm_key,
            readonly=False,
        )
        assert shml.shm.name == shm_key
        await trio.sleep(0.001)
 def test_child_attaches_alot():
    async def main():
        async with tractor.open_nursery() as an:
            # allocate writeable list in parent
            key = f'shml_{uuid.uuid4()}'
            shml = open_shm_list(
                key=key,
            )
            portal = await an.start_actor(
                'shm_attacher',
                enable_modules=[__name__],
            )
            async with (
                portal.open_context(
                    child_attach_shml_alot,
                    shm_key=shml.key,
                ) as (ctx, start_val),
            ):
                assert start_val == key
                await ctx.result()
            await portal.cancel_actor()
    trio.run(main)
@tractor.context
 async def child_read_shm_list(
    ctx: tractor.Context,
    shm_key: str,
    use_str: bool,
    frame_size: int,
 ) -> None:
    # attach in child
    shml = attach_shm_list(
        key=shm_key,
        # dtype=str if use_str else float,
    )
    await ctx.started(shml.key)
    async with ctx.open_stream() as stream:
        async for i in stream:
            print(f'(child): reading shm list index: {i}')
            if use_str:
                expect = str(float(i))
            else:
                expect = float(i)
            if frame_size == 1:
                val = shml[i]
                assert expect == val
                print(f'(child): reading value: {val}')
            else:
                frame = shml[i - frame_size:i]
                print(f'(child): reading frame: {frame}')
@pytest.mark.parametrize(
    'use_str',
    [False, True],
    ids=lambda i: f'use_str_values={i}',
 )
@pytest.mark.parametrize(
    'frame_size',
    [1, 2**6, 2**10],
    ids=lambda i: f'frame_size={i}',
 )
 def test_parent_writer_child_reader(
    use_str: bool,
    frame_size: int,
 ):
    async def main():
        async with tractor.open_nursery(
            # debug_mode=True,
        ) as an:
            portal = await an.start_actor(
                'shm_reader',
                enable_modules=[__name__],
                debug_mode=True,
            )
            # allocate writeable list in parent
            key = 'shm_list'
            seq_size = int(2 * 2 ** 10)
            shml = open_shm_list(
                key=key,
                size=seq_size,
                dtype=str if use_str else float,
                readonly=False,
            )
            async with (
                portal.open_context(
                    child_read_shm_list,
                    shm_key=key,
                    use_str=use_str,
                    frame_size=frame_size,
                ) as (ctx, sent),
                ctx.open_stream() as stream,
            ):
                assert sent == key
                for i in range(seq_size):
                    val = float(i)
                    if use_str:
                        val = str(val)
                    # print(f'(parent): writing {val}')
                    shml[i] = val
                    # only on frame fills do we
                    # signal to the child that a frame's
                    # worth is ready.
                    if (i % frame_size) == 0:
                        print(f'(parent): signalling frame full on {val}')
                        await stream.send(i)
                else:
                    print(f'(parent): signalling final frame on {val}')
                    await stream.send(i)
            await portal.cancel_actor()
    trio.run(main)
--- a/tests/test_trioisms.py
+++ b/tests/test_trioisms.py
@ -5,7 +5,7 @@ want to see changed.
 '''
 import pytest
 import trio
-from trio import TaskStatus
+from trio_typing import TaskStatus
@pytest.mark.parametrize(
--- a/tractor/_context.py
+++ b/tractor/_context.py
@ -169,7 +169,8 @@ async def _drain_to_final_msg(
            # only when we are sure the remote error is
            # the source cause of this local task's
            # cancellation.
-            ctx.maybe_raise()
+            if re := ctx._remote_error:
                ctx._maybe_raise_remote_err(re)
            # CASE 1: we DID request the cancel we simply
            # continue to bubble up as normal.
@ -256,13 +257,6 @@ async def _drain_to_final_msg(
                )
            # XXX fallthrough to handle expected error XXX
            # TODO: replace this with `ctx.maybe_raise()`
            #
            # TODO: would this be handier for this case maybe?
            # async with maybe_raise_on_exit() as raises:
            #     if raises:
            #         log.error('some msg about raising..')
            re: Exception|None = ctx._remote_error
            if re:
                log.critical(
@ -601,7 +595,7 @@ class Context:
        if not re:
            return False
-        if from_uid := re.src_uid:
+        if from_uid := re.src_actor_uid:
            from_uid: tuple = tuple(from_uid)
        our_uid: tuple = self._actor.uid
@ -831,7 +825,7 @@ class Context:
        # cancellation.
        maybe_error_src: tuple = getattr(
            error,
-            'src_uid',
+            'src_actor_uid',
            None,
        )
        self._canceller = (
@ -868,9 +862,6 @@ class Context:
        # TODO: maybe we should also call `._res_scope.cancel()` if it
        # exists to support cancelling any drain loop hangs?
        # NOTE: this usage actually works here B)
        # from .devx._debug import breakpoint
        # await breakpoint()
    # TODO: add to `Channel`?
    @property
@ -1039,8 +1030,8 @@ class Context:
    @acm
    async def open_stream(
        self,
-        allow_overruns: bool|None = False,
+        allow_overruns: bool | None = False,
-        msg_buffer_size: int|None = None,
+        msg_buffer_size: int | None = None,
    ) -> AsyncGenerator[MsgStream, None]:
        '''
@ -1080,16 +1071,13 @@ class Context:
            # absorbed there (silently) and we DO NOT want to
            # actually try to stream - a cancel msg was already
            # sent to the other side!
-            self.maybe_raise(
+            if self._remote_error:
-                raise_ctxc_from_self_call=True,
+                # NOTE: this is diff then calling
-            )
+                # `._maybe_raise_remote_err()` specifically
-            # NOTE: this is diff then calling
+                # because any task entering this `.open_stream()`
-            # `._maybe_raise_remote_err()` specifically
+                # AFTER cancellation has already been requested,
-            # because we want to raise a ctxc on any task entering this `.open_stream()`
+                # we DO NOT want to absorb any ctxc ACK silently!
-            # AFTER cancellation was already been requested,
+                raise self._remote_error
            # we DO NOT want to absorb any ctxc ACK silently!
            # if self._remote_error:
            #     raise self._remote_error
            # XXX NOTE: if no `ContextCancelled` has been responded
            # back from the other side (yet), we raise a different
@ -1170,6 +1158,7 @@ class Context:
                # await trio.lowlevel.checkpoint()
                yield stream
                # XXX: (MEGA IMPORTANT) if this is a root opened process we
                # wait for any immediate child in debug before popping the
                # context from the runtime msg loop otherwise inside
@ -1194,23 +1183,12 @@ class Context:
                #
                # await stream.aclose()
-            # NOTE: absorb and do not raise any
+                # if re := ctx._remote_error:
-            # EoC received from the other side such that
+                #     ctx._maybe_raise_remote_err(
-            # it is not raised inside the surrounding
+                #         re,
-            # context block's scope!
+                #         raise_ctxc_from_self_call=True,
-            except trio.EndOfChannel as eoc:
+                #     )
-                if (
+                # await trio.lowlevel.checkpoint()
                    eoc
                    and stream.closed
                ):
                    # sanity, can remove?
                    assert eoc is stream._eoc
                    # from .devx import pause
                    # await pause()
                    log.warning(
                        'Stream was terminated by EoC\n\n'
                        f'{repr(eoc)}\n'
                    )
            finally:
                if self._portal:
@ -1226,6 +1204,7 @@ class Context:
    # TODO: replace all the instances of this!! XD
    def maybe_raise(
        self,
        hide_tb: bool = True,
        **kwargs,
@ -1409,41 +1388,33 @@ class Context:
                f'{drained_msgs}'
            )
-        self.maybe_raise(
+        if (
-            raise_overrun_from_self=(
+            (re := self._remote_error)
-                raise_overrun
+            # and self._result == res_placeholder
-                and
+        ):
-                # only when we ARE NOT the canceller
+            self._maybe_raise_remote_err(
-                # should we raise overruns, bc ow we're
+                re,
-                # raising something we know might happen
+                # NOTE: obvi we don't care if we
-                # during cancellation ;)
+                # overran the far end if we're already
-                (not self._cancel_called)
+                # waiting on a final result (msg).
                # raise_overrun_from_self=False,
                raise_overrun_from_self=(
                    raise_overrun
                    and
                    # only when we ARE NOT the canceller
                    # should we raise overruns, bc ow we're
                    # raising something we know might happen
                    # during cancellation ;)
                    (not self._cancel_called)
                ),
            )
        )
        # if (
        #     (re := self._remote_error)
        #     # and self._result == res_placeholder
        # ):
        #     self._maybe_raise_remote_err(
        #         re,
        #         # NOTE: obvi we don't care if we
        #         # overran the far end if we're already
        #         # waiting on a final result (msg).
        #         # raise_overrun_from_self=False,
        #         raise_overrun_from_self=(
        #             raise_overrun
        #             and
        #             # only when we ARE NOT the canceller
        #             # should we raise overruns, bc ow we're
        #             # raising something we know might happen
        #             # during cancellation ;)
        #             (not self._cancel_called)
        #         ),
        #     )
            # if maybe_err:
            #     self._result = maybe_err
        return self.outcome
            # None if self._result == res_placeholder
            # else self._result
        # )
    # TODO: switch this with above which should be named
    # `.wait_for_outcome()` and instead do
@ -1892,9 +1863,8 @@ async def open_context_from_portal(
    # TODO: if we set this the wrapping `@acm` body will
    # still be shown (awkwardly) on pdb REPL entry. Ideally
-    # we can similarly annotate that frame to NOT show? for now
+    # we can similarly annotate that frame to NOT show?
-    # we DO SHOW this frame since it's awkward ow..
+    hide_tb: bool = True,
    hide_tb: bool = False,
    # proxied to RPC
    **kwargs,
--- a/tractor/_exceptions.py
+++ b/tractor/_exceptions.py
@ -30,10 +30,11 @@ from typing import (
 import textwrap
 import traceback
 import exceptiongroup as eg
 import trio
-from tractor._state import current_actor
+from ._state import current_actor
-from tractor.log import get_logger
+from .log import get_logger
 if TYPE_CHECKING:
    from ._context import Context
@ -372,6 +373,7 @@ def unpack_error(
        for ns in [
            builtins,
            _this_mod,
            eg,
            trio,
        ]:
            if suberror_type := getattr(
@ -394,13 +396,12 @@ def unpack_error(
 def is_multi_cancelled(exc: BaseException) -> bool:
    '''
-    Predicate to determine if a possible ``BaseExceptionGroup`` contains
+    Predicate to determine if a possible ``eg.BaseExceptionGroup`` contains
    only ``trio.Cancelled`` sub-exceptions (and is likely the result of
    cancelling a collection of subtasks.
    '''
-    # if isinstance(exc, eg.BaseExceptionGroup):
+    if isinstance(exc, eg.BaseExceptionGroup):
    if isinstance(exc, BaseExceptionGroup):
        return exc.subgroup(
            lambda exc: isinstance(exc, trio.Cancelled)
        ) is not None
--- a/tractor/_root.py
+++ b/tractor/_root.py
@ -28,13 +28,12 @@ import os
 import warnings
 from exceptiongroup import BaseExceptionGroup
 import trio
 from ._runtime import (
    Actor,
    Arbiter,
    # TODO: rename and make a non-actor subtype?
    # Arbiter as Registry,
    async_main,
 )
 from .devx import _debug
@ -326,10 +325,10 @@ async def open_root_actor(
            ) as err:
                entered: bool = await _debug._maybe_enter_pm(err)
                if (
                    not entered
-                    and
+                    and not is_multi_cancelled(err)
                    not is_multi_cancelled(err)
                ):
                    logger.exception('Root actor crashed:\n')
--- a/tractor/_rpc.py
+++ b/tractor/_rpc.py
@ -21,7 +21,6 @@ Remote (task) Procedure Call (scheduling) with SC transitive semantics.
 from __future__ import annotations
 from contextlib import (
    asynccontextmanager as acm,
    aclosing,
 )
 from functools import partial
 import inspect
@ -35,12 +34,17 @@ from typing import (
 )
 import warnings
 from async_generator import aclosing
 from exceptiongroup import BaseExceptionGroup
 import trio
 from trio import (
    CancelScope,
    Nursery,
    TaskStatus,
 )
 # from trio_typing import (
 #     TaskStatus,
 # )
 from .msg import NamespacePath
 from ._ipc import Channel
--- a/tractor/_runtime.py
+++ b/tractor/_runtime.py
@ -45,7 +45,6 @@ from functools import partial
 from itertools import chain
 import importlib
 import importlib.util
 import os
 from pprint import pformat
 import signal
 import sys
@ -56,11 +55,14 @@ from typing import (
 )
 import uuid
 from types import ModuleType
 import os
 import warnings
 import trio
 from trio import (
    CancelScope,
 )
 from trio_typing import (
    Nursery,
    TaskStatus,
 )
@ -78,7 +80,11 @@ from ._exceptions import (
    ContextCancelled,
    TransportClosed,
 )
-from .devx import _debug
+from .devx import (
    # pause,
    maybe_wait_for_debugger,
    _debug,
 )
 from ._discovery import get_registry
 from ._portal import Portal
 from . import _state
@ -96,7 +102,7 @@ if TYPE_CHECKING:
 log = get_logger('tractor')
-def _get_mod_abspath(module):
+def _get_mod_abspath(module: ModuleType) -> str:
    return os.path.abspath(module.__file__)
@ -388,12 +394,6 @@ class Actor:
        self._no_more_peers = trio.Event()  # unset by making new
        chan = Channel.from_stream(stream)
        their_uid: tuple[str, str]|None = chan.uid
        if their_uid:
            log.warning(
                f'Re-connection from already known {their_uid}'
            )
        else:
           log.runtime(f'New connection to us @{chan.raddr}')
        con_msg: str = ''
        if their_uid:
@ -665,7 +665,7 @@ class Actor:
                                f'last disconnected child uid: {uid}\n'
                                f'locking child uid: {pdb_user_uid}\n'
                            )
-                            await _debug.maybe_wait_for_debugger(
+                            await maybe_wait_for_debugger(
                                child_in_debug=True
                            )
@ -717,12 +717,10 @@ class Actor:
                        f'|_{chan}\n'
                    )
                    try:
-                        # send msg loop terminate sentinel which
+                        # send a msg loop terminate sentinel
                        # triggers cancellation of all remotely
                        # started tasks.
                        await chan.send(None)
-                        # XXX: do we want this? no right?
+                        # XXX: do we want this?
                        # causes "[104] connection reset by peer" on other end
                        # await chan.aclose()
@ -1212,10 +1210,10 @@ class Actor:
            # - callee self raises ctxc before caller send request,
            # - callee errors prior to cancel req.
            log.cancel(
-                'Cancel request invalid, RPC task already completed?\n\n'
+                'Cancel request invalid, RPC task already completed?\n'
                f'<= canceller: {requesting_uid}\n\n'
-                f'=> {cid}@{parent_chan.uid}\n'
+                f'=>{parent_chan}\n'
-                f'  |_{parent_chan}\n'
+                f'  |_ctx-id: {cid}\n'
            )
            return True
@ -1394,8 +1392,8 @@ class Actor:
    @property
    def accept_addrs(self) -> list[tuple[str, int]]:
        '''
-        All addresses to which the transport-channel server binds
+        All addresses to which the IPC-transport-channel server
-        and listens for new connections.
+        binds and listens for new connections.
        '''
        # throws OSError on failure
@ -1514,6 +1512,7 @@ async def async_main(
            ):
                accept_addrs = set_accept_addr_says_rent
        # The "root" nursery ensures the channel with the immediate
        # parent is kept alive as a resilient service until
        # cancellation steps have (mostly) occurred in
@ -1567,9 +1566,9 @@ async def async_main(
                    # transport address bind errors - normally it's
                    # something silly like the wrong socket-address
                    # passed via a config or CLI Bo
-                    entered_debug: bool = await _debug._maybe_enter_pm(oserr)
+                    entered_debug = await _debug._maybe_enter_pm(oserr)
-                    if not entered_debug:
+                    if entered_debug:
-                        log.exception('Failed to init IPC channel server !?\n')
+                        log.runtime('Exited debug REPL..')
                    raise
                accept_addrs: list[tuple[str, int]] = actor.accept_addrs
--- a/tractor/_shm.py
+++ b/tractor/_shm.py
@ -0,0 +1,833 @@
 # tractor: structured concurrent "actors".
 # Copyright 2018-eternity Tyler Goodlet.
 # This program is free software: you can redistribute it and/or modify
 # it under the terms of the GNU Affero General Public License as published by
 # the Free Software Foundation, either version 3 of the License, or
 # (at your option) any later version.
 # This program is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU Affero General Public License for more details.
 # You should have received a copy of the GNU Affero General Public License
 # along with this program.  If not, see <https://www.gnu.org/licenses/>.
 """
 SC friendly shared memory management geared at real-time
 processing.
 Support for ``numpy`` compatible array-buffers is provided but is
 considered optional within the context of this runtime-library.
 """
 from __future__ import annotations
 from sys import byteorder
 import time
 from typing import Optional
 from multiprocessing import shared_memory as shm
 from multiprocessing.shared_memory import (
    SharedMemory,
    ShareableList,
 )
 from msgspec import Struct
 import tractor
 from .log import get_logger
 _USE_POSIX = getattr(shm, '_USE_POSIX', False)
 if _USE_POSIX:
    from _posixshmem import shm_unlink
 try:
    import numpy as np
    from numpy.lib import recfunctions as rfn
    import nptyping
 except ImportError:
    pass
 log = get_logger(__name__)
 def disable_mantracker():
    '''
    Swap the stdlib ``multiprocessing`` "resource tracker" for a stub
    whose registration hooks do nothing, and re-point the module level
    helper functions at that stub.
    '''
    from multiprocessing import resource_tracker as mantracker
    # Subclass whose tracking hooks are all no-ops.
    class ManTracker(mantracker.ResourceTracker):
        def register(self, name, rtype):
            return None
        def unregister(self, name, rtype):
            return None
        def ensure_running(self):
            return None
    # "know your land and know your prey"
    # https://www.dailymotion.com/video/x6ozzco
    noop_tracker = ManTracker()
    mantracker._resource_tracker = noop_tracker
    # rebind the module-level aliases onto the stub instance
    for attr_name in (
        'register',
        'ensure_running',
        'unregister',
        'getfd',
    ):
        setattr(mantracker, attr_name, getattr(noop_tracker, attr_name))
 disable_mantracker()
 class SharedInt:
    '''
    An ``int`` stored in a single-entry shared memory segment, used
    as an index counter.
    '''
    def __init__(
        self,
        shm: SharedMemory,
    ) -> None:
        self._shm = shm
    @property
    def value(self) -> int:
        # decode the entire segment buffer using the host byte order
        raw = self._shm.buf
        return int.from_bytes(raw, byteorder)
    @value.setter
    def value(self, value) -> None:
        # encode to exactly the segment's size so the slice-assign
        # covers the whole buffer
        encoded = value.to_bytes(self._shm.size, byteorder)
        self._shm.buf[:] = encoded
    def destroy(self) -> None:
        # only the posix backend is unlinked by hand here
        if not _USE_POSIX:
            return
        # We manually unlink to bypass all the "resource tracker"
        # nonsense meant for non-SC systems.
        name = self._shm.name
        try:
            shm_unlink(name)
        except FileNotFoundError:
            # might be a teardown race here?
            log.warning(f'Shm for {name} already unlinked?')
 class NDToken(Struct, frozen=True):
    '''
    Internal representation of a shared memory ``numpy`` array "token"
    which can be used to key and load a system (OS) wide shm entry
    and correctly read the array by type signature.
    This type is msg safe.
    '''
    shm_name: str  # this serves as a "key" value
    shm_first_index_name: str
    shm_last_index_name: str
    dtype_descr: tuple
    size: int  # in struct-array index / row terms
    # TODO: use nptyping here on dtypes
    @property
    def dtype(self) -> list[tuple[str, str, tuple[int, ...]]]:
        '''
        Rebuild the ``numpy`` dtype description from the stored
        ``.dtype_descr`` entries (each entry is coerced to a ``tuple``
        first).
        '''
        return np.dtype(
            list(
                map(tuple, self.dtype_descr)
            )
        ).descr
    def as_msg(self) -> dict:
        '''
        Return this token's fields as a plain ``dict``.
        '''
        # NOTE: a plain `msgspec.Struct` provides no `.to_dict()`
        # method, so use the library's field -> value converter.
        from msgspec import structs
        return structs.asdict(self)
    @classmethod
    def from_msg(cls, msg: dict) -> NDToken:
        '''
        Build a token from its ``dict`` form; an ``NDToken`` input is
        returned untouched. The input mapping is never modified.
        '''
        if isinstance(msg, NDToken):
            return msg
        # TODO: native struct decoding
        # return _token_dec.decode(msg)
        # work on a shallow copy so the caller's dict is left as-is
        fields = dict(msg)
        fields['dtype_descr'] = tuple(map(tuple, fields['dtype_descr']))
        return NDToken(**fields)
 # _token_dec = msgspec.msgpack.Decoder(NDToken)
 # TODO: this api?
 # _known_tokens = tractor.ActorVar('_shm_tokens', {})
 # _known_tokens = tractor.ContextStack('_known_tokens', )
 # _known_tokens = trio.RunVar('shms', {})
 # TODO: this should maybe be provided via
 # a `.trionics.maybe_open_context()` wrapper factory?
 # process-local store of keys to tokens
 _known_tokens: dict[str, NDToken] = {}
 def get_shm_token(key: str) -> NDToken | None:
    '''
    Look up ``key`` in this process's local token registry and hand
    back the stored entry, or ``None`` when the key is not known.
    '''
    try:
        return _known_tokens[key]
    except KeyError:
        return None
 def _make_token(
    key: str,
    size: int,
    dtype: np.dtype,
 ) -> NDToken:
    '''
    Build the serializable token describing a shared array: the
    buffer is named ``key`` and its two index counters are named by
    suffixing ``key`` with "_first" and "_last".
    '''
    first_name = key + "_first"
    last_name = key + "_last"
    descr = tuple(np.dtype(dtype).descr)
    return NDToken(
        shm_name=key,
        shm_first_index_name=first_name,
        shm_last_index_name=last_name,
        dtype_descr=descr,
        size=size,
    )
 class ShmArray:
    '''
    A shared memory ``numpy.ndarray`` API.
    An underlying shared memory buffer is allocated based on
    a user specified ``numpy.ndarray``. This fixed size array
    can be read and written to by pushing data both onto the "front"
    or "back" of a set index range. The indexes for the "first" and
    "last" index are themselves stored in shared memory (accessed via
    ``SharedInt`` interfaces) values such that multiple processes can
    interact with the same array using a synchronized-index.
    '''
    def __init__(
        self,
        shmarr: np.ndarray,
        first: SharedInt,
        last: SharedInt,
        shm: SharedMemory,
        # readonly: bool = True,
    ) -> None:
        self._array = shmarr
        # counters for the first and last indices bounding
        # the filled data
        self._first = first
        self._last = last
        self._len = len(shmarr)
        self._shm = shm
        self._post_init: bool = False
        # pushing data does not write the index (aka primary key):
        # for a structured dtype every field but the first is written
        self._write_fields: list[str] | None = None
        dtype = shmarr.dtype
        if dtype.fields:
            self._write_fields = list(shmarr.dtype.fields.keys())[1:]
    # TODO: ringbuf api?
    @property
    def _token(self) -> NDToken:
        # token rebuilt from the live segment names and array dtype
        return NDToken(
            shm_name=self._shm.name,
            shm_first_index_name=self._first._shm.name,
            shm_last_index_name=self._last._shm.name,
            dtype_descr=tuple(self._array.dtype.descr),
            size=self._len,
        )
    @property
    def token(self) -> dict:
        """Shared memory token that can be serialized and used by
        another process to attach to this array.
        """
        return self._token.as_msg()
    @property
    def index(self) -> int:
        # "last" counter wrapped onto the fixed array length
        return self._last.value % self._len
    @property
    def array(self) -> np.ndarray:
        '''
        Return an up-to-date ``np.ndarray`` view of the
        so-far-written data to the underlying shm buffer.
        Raises ``RuntimeError`` if that view is empty after at least
        one successful ``.push()``.
        '''
        a = self._array[self._first.value:self._last.value]
        # first, last = self._first.value, self._last.value
        # a = self._array[first:last]
        # TODO: eventually comment this once we've not seen it in the
        # wild in a long time..
        # XXX: race where first/last indexes cause a reader
        # to load an empty array..
        if len(a) == 0 and self._post_init:
            raise RuntimeError('Empty array race condition hit!?')
            # breakpoint()
        return a
    def ustruct(
        self,
        fields: Optional[list[str]] = None,
        # type that all field values will be cast to
        # in the returned view.
        common_dtype: np.dtype = float,
    ) -> np.ndarray:
        '''
        Return an unstructured copy of the full underlying array,
        optionally restricted to ``fields``.
        NOTE: ``common_dtype`` is accepted but not currently applied.
        '''
        array = self._array
        if fields:
            selection = array[fields]
            # fcount = len(fields)
        else:
            selection = array
            # fcount = len(array.dtype.fields)
        # XXX: manual ``.view()`` attempt that also doesn't work.
        # uview = selection.view(
        #     dtype='<f16',
        # ).reshape(-1, 4, order='A')
        # assert len(selection) == len(uview)
        u = rfn.structured_to_unstructured(
            selection,
            # dtype=float,
            copy=True,
        )
        # unstruct = np.ndarray(u.shape, dtype=a.dtype, buffer=shm.buf)
        # array[:] = a[:]
        return u
        # return ShmArray(
        #     shmarr=u,
        #     first=self._first,
        #     last=self._last,
        #     shm=self._shm
        # )
    def last(
        self,
        length: int = 1,
    ) -> np.ndarray:
        '''
        Return the last ``length``'s worth of ("row") entries from the
        array.
        '''
        return self.array[-length:]
    def push(
        self,
        data: np.ndarray,
        field_map: Optional[dict[str, str]] = None,
        prepend: bool = False,
        update_first: bool = True,
        start: int | None = None,
    ) -> int:
        '''
        Ring buffer like "push" to append data
        into the buffer and return the end index of the written slice.
        With ``prepend=True`` the data is instead written just before
        the "first" index (or before ``start`` when given) and the
        "first" counter is moved back unless ``update_first=False``.
        ``field_map`` maps source field names in ``data`` to
        destination field names in the buffer; by default all
        non-index fields are copied by the same name.
        NB: no actual ring logic yet to give a "loop around" on overflow
        condition, lel.
        '''
        length = len(data)
        if prepend:
            index = (start or self._first.value) - length
            if index < 0:
                raise ValueError(
                    f'Array size of {self._len} was overrun during prepend.\n'
                    f'You have passed {abs(index)} too many datums.'
                )
        else:
            index = start if start is not None else self._last.value
        end = index + length
        if field_map:
            src_names, dst_names = zip(*field_map.items())
        else:
            dst_names = src_names = self._write_fields
        try:
            self._array[
                list(dst_names)
            ][index:end] = data[list(src_names)][:]
            # NOTE: there was a race here between updating
            # the first and last indices and when the next reader
            # tries to access ``.array`` (which due to the index
            # overlap will be empty). Pretty sure we've fixed it now
            # but leaving this here as a reminder.
            if (
                prepend
                and update_first
                and length
            ):
                assert index < self._first.value
            if (
                index < self._first.value
                and update_first
            ):
                assert prepend, 'prepend=True not passed but index decreased?'
                self._first.value = index
            elif not prepend:
                self._last.value = end
            self._post_init = True
            return end
        except ValueError as err:
            if field_map:
                raise
            # should raise if diff detected
            self.diff_err_fields(data)
            raise err
    def diff_err_fields(
        self,
        data: np.ndarray,
    ) -> None:
        '''
        Raise a ``TypeError`` naming any field present in only one of
        our array's dtype and ``data``'s dtype; no-op if they match.
        '''
        # reraise with any field discrepancy
        our_fields, their_fields = (
            set(self._array.dtype.fields),
            set(data.dtype.fields),
        )
        only_in_ours = our_fields - their_fields
        only_in_theirs = their_fields - our_fields
        if only_in_ours:
            raise TypeError(
                f"Input array is missing field(s): {only_in_ours}"
            )
        elif only_in_theirs:
            raise TypeError(
                f"Input array has unknown field(s): {only_in_theirs}"
            )
    # TODO: support "silent" prepends that don't update ._first.value?
    def prepend(
        self,
        data: np.ndarray,
    ) -> int:
        '''
        Write ``data`` just before the current "first" index and
        return the end index of the written slice.
        '''
        end = self.push(data, prepend=True)
        assert end
        # hand back the index as promised by the return annotation
        return end
    def close(self) -> None:
        # close this process's handles on all three segments
        self._first._shm.close()
        self._last._shm.close()
        self._shm.close()
    def destroy(self) -> None:
        if _USE_POSIX:
            # We manually unlink to bypass all the "resource tracker"
            # nonsense meant for non-SC systems.
            shm_unlink(self._shm.name)
        self._first.destroy()
        self._last.destroy()
    def flush(self) -> None:
        # TODO: flush to storage backend like markestore?
        ...
 def open_shm_ndarray(
    size: int,
    key: str | None = None,
    dtype: np.dtype | None = None,
    append_start_index: int | None = None,
    readonly: bool = False,
 ) -> ShmArray:
    '''
    Allocate a new shared memory backed ``numpy`` array of ``size``
    rows (plus its two shared index counters) using the standard
    library and wrap it in a ``ShmArray``.
    When ``key`` is ``None`` the auto-generated name of the newly
    created buffer is used as the key.
    This call unlinks (aka permanently destroys) the buffer on teardown
    and thus should be used from the parent-most accessor (process).
    '''
    # create new shared mem segment for which we
    # have write permission
    a = np.zeros(size, dtype=dtype)
    # NOTE: requires a dtype which declares an 'index' field
    a['index'] = np.arange(len(a))
    shm = SharedMemory(
        name=key,
        create=True,
        size=a.nbytes
    )
    # no explicit key: adopt the name generated for the new segment
    # so the index-counter names and registry key below are built
    # from a real ``str`` instead of failing on ``None``.
    if key is None:
        key = shm.name
    array = np.ndarray(
        a.shape,
        dtype=a.dtype,
        buffer=shm.buf
    )
    array[:] = a[:]
    array.setflags(write=int(not readonly))
    token = _make_token(
        key=key,
        size=size,
        dtype=dtype,
    )
    # create single entry arrays for storing an first and last indices
    first = SharedInt(
        shm=SharedMemory(
            name=token.shm_first_index_name,
            create=True,
            size=4,  # std int
        )
    )
    last = SharedInt(
        shm=SharedMemory(
            name=token.shm_last_index_name,
            create=True,
            size=4,  # std int
        )
    )
    # Start the "real-time" append-updated (or "pushed-to") section
    # after some start index: ``append_start_index``. This allows appending
    # from a start point in the array which isn't the 0 index and looks
    # something like,
    # -------------------------
    # |              |        i
    # _________________________
    # <-------------> <------->
    #  history         real-time
    #
    # Once fully "prepended", the history section will leave the
    # ``ShmArray._first.value: int = 0`` and the yet-to-be written
    # real-time section will start at ``ShmArray.index: int``.
    # this sets the index to nearly 2/3rds into the the length of
    # the buffer leaving at least a "days worth of second samples"
    # for the real-time section.
    if append_start_index is None:
        append_start_index = round(size * 0.616)
    last.value = first.value = append_start_index
    shmarr = ShmArray(
        array,
        first,
        last,
        shm,
    )
    assert shmarr._token == token
    _known_tokens[key] = shmarr.token
    # "unlink" created shm on process teardown by
    # pushing teardown calls onto actor context stack
    stack = tractor.current_actor().lifetime_stack
    stack.callback(shmarr.close)
    stack.callback(shmarr.destroy)
    return shmarr
 def attach_shm_ndarray(
    token: tuple[str, str, tuple[str, str]],
    readonly: bool = True,
 ) -> ShmArray:
    '''
    Wrap an already allocated shared memory array (and its two
    shared index counters) described by ``token`` in a ``ShmArray``.
    Nothing new is allocated; only the read/write accessor objects
    are built around the existing segments.
    '''
    tok = NDToken.from_msg(token)
    key = tok.shm_name
    # a token already registered under this key must match the input
    if key in _known_tokens:
        assert NDToken.from_msg(_known_tokens[key]) == tok, "WTF"
    # XXX: ugh, looks like due to the ``shm_open()`` C api we can't
    # actually place files in a subdir, see discussion here:
    # https://stackoverflow.com/a/11103289
    # attach to the array buffer, retrying a few times with a short
    # pause whenever the open fails
    last_err: Optional[Exception] = None
    for _attempt in range(3):
        try:
            buf_shm = SharedMemory(
                name=key,
                create=False,
            )
        except OSError as oserr:
            last_err = oserr
            time.sleep(0.1)
        else:
            break
    else:
        # every attempt failed
        if last_err:
            raise last_err
    # view the raw buffer as per the token's dtype
    nd_view = np.ndarray(
        (tok.size,),
        dtype=tok.dtype,
        buffer=buf_shm.buf
    )
    nd_view.setflags(write=int(not readonly))
    first_shm = SharedMemory(
        name=tok.shm_first_index_name,
        create=False,
        size=4,  # std int
    )
    first = SharedInt(shm=first_shm)
    last_shm = SharedMemory(
        name=tok.shm_last_index_name,
        create=False,
        size=4,  # std int
    )
    last = SharedInt(shm=last_shm)
    # make sure we can read
    first.value
    shm_array = ShmArray(
        nd_view,
        first,
        last,
        buf_shm,
    )
    # read test
    shm_array.array
    # Stash key -> token knowledge for future lookups but only
    # after we know we can attach; an existing entry is kept.
    _known_tokens.setdefault(key, tok)
    # "close" attached shm on actor teardown
    tractor.current_actor().lifetime_stack.callback(shm_array.close)
    return shm_array
 def maybe_open_shm_ndarray(
    key: str,  # unique identifier for segment
    size: int,
    dtype: np.dtype | None = None,
    append_start_index: int = 0,
    readonly: bool = True,
 ) -> tuple[ShmArray, bool]:
    '''
    Attempt to attach to a shared memory block using a "key" lookup
    to registered blocks in the users overall "system" registry
    (presumes you don't have the block's explicit token).
    This function is meant to solve the problem of discovering whether
    a shared array token has been allocated or discovered by the actor
    running in **this** process. Systems where multiple actors may seek
    to access a common block can use this function to attempt to acquire
    a token as discovered by the actors who have previously stored
    a "key" -> ``NDToken`` map in an actor local (aka python global)
    variable.
    Returns the array plus a flag which is ``True`` only when the
    block was newly opened (allocated) by this call.
    If you know the explicit ``NDToken`` for your memory segment instead
    use ``attach_shm_ndarray``.
    '''
    try:
        # see if we already know this key
        token = _known_tokens[key]
        return (
            attach_shm_ndarray(
                token=token,
                readonly=readonly,
            ),
            False,  # not newly opened
        )
    except KeyError:
        log.warning(f"Could not find {key} in shms cache")
        # a token can only be synthesized when the dtype is known;
        # with one in hand, first try attaching to a block already
        # allocated under this key before opening a new one.
        if dtype is not None:
            token = _make_token(
                key,
                size=size,
                dtype=dtype,
            )
            try:
                return (
                    attach_shm_ndarray(
                        token=token,
                        readonly=readonly,
                    ),
                    False,
                )
            except FileNotFoundError:
                log.warning(f"Could not attach to shm with token {token}")
        # This actor does not know about memory
        # associated with the provided "key".
        # Attempt to open a block and expect
        # to fail if a block has been allocated
        # on the OS by someone else.
        return (
            open_shm_ndarray(
                key=key,
                size=size,
                dtype=dtype,
                append_start_index=append_start_index,
                readonly=readonly,
            ),
            True,
        )
 class ShmList(ShareableList):
    '''
    Carbon copy of ``.shared_memory.ShareableList`` with a few
    enhancements:
    - readonly mode via instance var flag  `._readonly: bool`
    - ``.__getitem__()`` accepts ``slice`` inputs
    - exposes the underlying buffer "name" as a ``.key: str``
    '''
    def __init__(
        self,
        sequence: list | None = None,
        *,
        name: str | None = None,
        readonly: bool = True
    ) -> None:
        self._readonly = readonly
        self._key = name
        super().__init__(
            sequence=sequence,
            name=name,
        )
        # no explicit name: the segment got an auto-generated one,
        # expose that so `.key` is always a usable `str`.
        if self._key is None:
            self._key = self.shm.name
    @property
    def key(self) -> str:
        return self._key
    @property
    def readonly(self) -> bool:
        return self._readonly
    def __setitem__(
        self,
        position,
        value,
    ) -> None:
        # mimick ``numpy`` error
        if self._readonly:
            raise ValueError('assignment destination is read-only')
        return super().__setitem__(position, value)
    def __getitem__(
        self,
        indexish,
    ) -> list:
        # NOTE: a slice input yields a new plain ``list`` built from
        # a full copy of the entries; it is not a writeable view.
        if isinstance(indexish, slice):
            return list(self)[indexish]
        return super().__getitem__(indexish)
    # TODO: should we offer a `.array` and `.push()` equivalent
    # to the `ShmArray`?
    # currently we have the following limitations:
    # - can't write slices of input using traditional slice-assign
    #   syntax due to the ``ShareableList.__setitem__()`` implementation.
    # - ``list(shmlist)`` returns a non-mutable copy instead of
    #   a writeable view which would be handier numpy-style ops.
 def open_shm_list(
    key: str,
    sequence: list | None = None,
    size: int = int(2 ** 10),
    dtype: float | int | bool | str | bytes | None = float,
    readonly: bool = True,
 ) -> ShmList:
    '''
    Create a ``ShmList`` named ``key``. When no ``sequence`` is
    given the list is pre-filled with ``size`` copies of a per-
    ``dtype`` placeholder value.
    If a ``tractor`` actor is active, closing and unlinking of the
    underlying segment is scheduled on its lifetime stack.
    '''
    if sequence is None:
        # placeholder fill value per supported element type
        fill_values = {
            float: 0.,
            int: 0,
            bool: True,
            str: 'doggy',
            None: None,
        }
        sequence = [fill_values[dtype]] * size
    shm_list = ShmList(
        sequence=sequence,
        name=key,
        readonly=readonly,
    )
    # "close" attached shm on actor teardown
    try:
        lifetime_stack = tractor.current_actor().lifetime_stack
        lifetime_stack.callback(shm_list.shm.close)
        lifetime_stack.callback(shm_list.shm.unlink)
    except RuntimeError:
        log.warning('tractor runtime not active, skipping teardown steps')
    return shm_list
 def attach_shm_list(
    key: str,
    readonly: bool = False,
 ) -> ShmList:
    '''
    Build a ``ShmList`` around the segment named ``key`` without
    passing any initial sequence.
    '''
    attached = ShmList(name=key, readonly=readonly)
    return attached
--- a/tractor/_spawn.py
+++ b/tractor/_spawn.py
@ -31,24 +31,25 @@ from typing import (
    TYPE_CHECKING,
 )
 from exceptiongroup import BaseExceptionGroup
 import trio
-from trio import TaskStatus
+from trio_typing import TaskStatus
-from .devx._debug import (
+from .devx import (
    maybe_wait_for_debugger,
    acquire_debug_lock,
 )
-from tractor._state import (
+from ._state import (
    current_actor,
    is_main_process,
    is_root_process,
    debug_mode,
 )
-from tractor.log import get_logger
+from .log import get_logger
-from tractor._portal import Portal
+from ._portal import Portal
-from tractor._runtime import Actor
+from ._runtime import Actor
-from tractor._entry import _mp_main
+from ._entry import _mp_main
-from tractor._exceptions import ActorFailure
+from ._exceptions import ActorFailure
 if TYPE_CHECKING:
@ -220,10 +221,6 @@ async def hard_kill(
    # whilst also hacking on it XD
    # terminate_after: int = 99999,
    # NOTE: for mucking with `.pause()`-ing inside the runtime
    # whilst also hacking on it XD
    # terminate_after: int = 99999,
 ) -> None:
    '''
    Un-gracefully terminate an OS level `trio.Process` after timeout.
--- a/tractor/_streaming.py
+++ b/tractor/_streaming.py
@ -136,7 +136,7 @@ class MsgStream(trio.abc.Channel):
        #         return await self.receive()
        #     except trio.EndOfChannel:
        #         raise StopAsyncIteration
-        #
+
        # see ``.aclose()`` for notes on the old behaviour prior to
        # introducing this
        if self._eoc:
@ -152,6 +152,7 @@ class MsgStream(trio.abc.Channel):
                return msg['yield']
            except KeyError as kerr:
                # log.exception('GOT KEYERROR')
                src_err = kerr
                # NOTE: may raise any of the below error types
@ -165,20 +166,30 @@ class MsgStream(trio.abc.Channel):
                    stream=self,
                )
-        # XXX: the stream terminates on either of:
+        # XXX: we close the stream on any of these error conditions:
        # - via `self._rx_chan.receive()` raising  after manual closure
        #   by the rpc-runtime OR,
        # - via a received `{'stop': ...}` msg from remote side.
        #   |_ NOTE: previously this was triggered by calling
        #   ``._rx_chan.aclose()`` on the send side of the channel inside
        #   `Actor._push_result()`, but now the 'stop' message handling
        #   has been put just above inside `_raise_from_no_key_in_msg()`.
        except (
-            trio.EndOfChannel,
+            # trio.ClosedResourceError,  # by self._rx_chan
            trio.EndOfChannel,  # by self._rx_chan or `stop` msg from far end
        ) as eoc:
            # log.exception('GOT EOC')
            src_err = eoc
            self._eoc = eoc
            # a ``ClosedResourceError`` indicates that the internal
            # feeder memory receive channel was closed likely by the
            # runtime after the associated transport-channel
            # disconnected or broke.
            # an ``EndOfChannel`` indicates either the internal recv
            # memchan exhausted **or** we raised it just above after
            # receiving a `stop` message from the far end of the stream.
            # Previously this was triggered by calling ``.aclose()`` on
            # the send side of the channel inside
            # ``Actor._push_result()`` (should still be commented code
            # there - which should eventually get removed), but now the
            # 'stop' message handling has been put just above.
            # TODO: Locally, we want to close this stream gracefully, by
            # terminating any local consumers tasks deterministically.
            # Once we have broadcast support, we **don't** want to be
@ -199,11 +210,8 @@ class MsgStream(trio.abc.Channel):
            # raise eoc
-        # a ``ClosedResourceError`` indicates that the internal
+        except trio.ClosedResourceError as cre:  # by self._rx_chan
-        # feeder memory receive channel was closed likely by the
+            # log.exception('GOT CRE')
        # runtime after the associated transport-channel
        # disconnected or broke.
        except trio.ClosedResourceError as cre:  # by self._rx_chan.receive()
            src_err = cre
            log.warning(
                '`Context._rx_chan` was already closed?'
@ -229,30 +237,15 @@ class MsgStream(trio.abc.Channel):
        # over the end-of-stream connection error since likely
        # the remote error was the source cause?
        ctx: Context = self._ctx
-        ctx.maybe_raise(
+        if re := ctx._remote_error:
-            raise_ctxc_from_self_call=True,
+            ctx._maybe_raise_remote_err(
-        )
+                re,
                raise_ctxc_from_self_call=True,
            )
-        # propagate any error but hide low-level frame details
+        # propagate any error but hide low-level frames from
-        # from the caller by default for debug noise reduction.
+        # caller by default.
-        if (
+        if hide_tb:
            hide_tb
            # XXX NOTE XXX don't reraise on certain
            # stream-specific internal error types like,
            #
            # - `trio.EoC` since we want to use the exact instance
            #   to ensure that it is the error that bubbles upward
            #   for silent absorption by `Context.open_stream()`.
            and not self._eoc
            # - `RemoteActorError` (or `ContextCancelled`) if it gets
            #   raised from `_raise_from_no_key_in_msg()` since we
            #   want the same (as the above bullet) for any
            #   `.open_context()` block bubbled error raised by
            #   any nearby ctx API remote-failures.
            # and not isinstance(src_err, RemoteActorError)
        ):
            raise type(src_err)(*src_err.args) from src_err
        else:
            raise src_err
@ -377,10 +370,6 @@ class MsgStream(trio.abc.Channel):
        #         await rx_chan.aclose()
        if not self._eoc:
            log.cancel(
                'Stream closed before it received an EoC?\n'
                'Setting eoc manually..\n..'
            )
            self._eoc: bool = trio.EndOfChannel(
                f'Context stream closed by {self._ctx.side}\n'
                f'|_{self}\n'
@ -425,11 +414,13 @@ class MsgStream(trio.abc.Channel):
    @property
    def closed(self) -> bool:
-
+        if (
-        rxc: bool = self._rx_chan._closed
+            (rxc := self._rx_chan._closed)
-        _closed: bool|Exception = self._closed
+            or
-        _eoc: bool|trio.EndOfChannel = self._eoc
+            (_closed := self._closed)
-        if rxc or _closed or _eoc:
+            or
            (_eoc := self._eoc)
        ):
            log.runtime(
                f'`MsgStream` is already closed\n'
                f'{self}\n'
@ -505,11 +496,7 @@ class MsgStream(trio.abc.Channel):
        '''
        __tracebackhide__: bool = hide_tb
        # raise any already known error immediately
        self._ctx.maybe_raise()
        if self._eoc:
            raise self._eoc
        if self._closed:
            raise self._closed
--- a/tractor/_supervise.py
+++ b/tractor/_supervise.py
@ -26,6 +26,7 @@ from typing import TYPE_CHECKING
 import typing
 import warnings
 from exceptiongroup import BaseExceptionGroup
 import trio
 from .devx._debug import maybe_wait_for_debugger
--- a/tractor/experimental/_pubsub.py
+++ b/tractor/experimental/_pubsub.py
@ -31,7 +31,7 @@ from typing import (
    Callable,
 )
 from functools import partial
-from contextlib import aclosing
+from async_generator import aclosing
 import trio
 import wrapt
--- a/tractor/trionics/_mngrs.py
+++ b/tractor/trionics/_mngrs.py
@ -33,9 +33,10 @@ from typing import (
 )
 import trio
 from trio_typing import TaskStatus
-from tractor._state import current_actor
+from .._state import current_actor
-from tractor.log import get_logger
+from ..log import get_logger
 log = get_logger(__name__)
@ -183,7 +184,7 @@ class _Cache:
        cls,
        mng,
        ctx_key: tuple,
-        task_status: trio.TaskStatus[T] = trio.TASK_STATUS_IGNORED,
+        task_status: TaskStatus[T] = trio.TASK_STATUS_IGNORED,
    ) -> None:
        async with mng as value: