6 changed files with 314 additions and 309 deletions
--- a/piker/data/_ahab.py
+++ b/piker/data/_ahab.py
@ -24,6 +24,7 @@ from typing import (
    # Any,
 )
 from contextlib import asynccontextmanager as acm
+# import time

 import trio
 from trio_typing import TaskStatus
@ -96,7 +97,6 @@ async def open_docker(
            base_url=url,
            **kwargs
        ) if url else docker.from_env(**kwargs)
-
        yield client

    except (
@ -127,10 +127,43 @@ async def open_docker(

    finally:
        if client:
+            # for c in client.containers.list():
+            #     c.kill()
            client.close()
            # client.api._custom_adapter.close()
-            for c in client.containers.list():
-                c.kill()
+
+
+# async def waitfor(
+#     cntr: Container,
+#     attr_path: tuple[str],
+#     expect=None,
+#     timeout: float = 0.5,
+
+# ) -> Any:
+#     '''
+#     Wait for a container's attr value to be set. If ``expect`` is
+#     provided wait for the value to be set to that value.
+
+#     This is an async version of the helper from our ``pytest-dockerctl``
+#     plugin.
+
+#     '''
+#     def get(val, path):
+#         for key in path:
+#             val = val[key]
+#         return val
+
+#     start = time.time()
+#     while time.time() - start < timeout:
+#         cntr.reload()
+#         val = get(cntr.attrs, attr_path)
+#         if expect is None and val:
+#             return val
+#         elif val == expect:
+#             return val
+#     else:
+#         raise TimeoutError("{} failed to be {}, value: \"{}\"".format(
+#             attr_path, expect if expect else 'not None', val))


@tractor.context
@ -187,7 +220,7 @@ async def open_marketstored(
            },
            mounts=[config_dir_mnt, data_dir_mnt],
            detach=True,
-            # stop_signal='SIGINT',
+            stop_signal='SIGINT',
            init=True,
            # remove=True,
        )
@ -214,7 +247,7 @@ async def open_marketstored(
                        seen_so_far.add(entry)
                        if bp_on_msg:
                            await tractor.breakpoint()
-                        getattr(log, level, log.error)(f'{msg}')
+                        getattr(log, level)(f'{msg}')

                    # if "launching tcp listener for all services..." in msg:
                    if match in msg:
@ -236,8 +269,6 @@ async def open_marketstored(
                    )

            await ctx.started(cntr.id)
-
-            # block for the expected "teardown log msg"..
            await process_logs_until('exiting...',)

        except (
--- a/piker/data/_source.py
+++ b/piker/data/_source.py
@ -22,7 +22,8 @@ from typing import Any
 import decimal

 import numpy as np
-from pydantic import BaseModel
+import pandas as pd
+from pydantic import BaseModel, validate_arguments
 # from numba import from_dtype


@ -253,6 +254,61 @@ class Symbol(BaseModel):
        return keys


+def from_df(
+
+    df: pd.DataFrame,
+    source=None,
+    default_tf=None
+
+) -> np.recarray:
+    """Convert OHLC formatted ``pandas.DataFrame`` to ``numpy.recarray``.
+
+    """
+    df.reset_index(inplace=True)
+
+    # hackery to convert field names
+    date = 'Date'
+    if 'date' in df.columns:
+        date = 'date'
+
+    # convert to POSIX time
+    df[date] = [d.timestamp() for d in df[date]]
+
+    # try to rename from some camel case
+    columns = {
+        'Date': 'time',
+        'date': 'time',
+        'Open': 'open',
+        'High': 'high',
+        'Low': 'low',
+        'Close': 'close',
+        'Volume': 'volume',
+
+        # most feeds are providing this over sesssion anchored
+        'vwap': 'bar_wap',
+
+        # XXX: ib_insync calls this the "wap of the bar"
+        # but no clue what is actually is...
+        # https://github.com/pikers/piker/issues/119#issuecomment-729120988
+        'average': 'bar_wap',
+    }
+
+    df = df.rename(columns=columns)
+
+    for name in df.columns:
+        # if name not in base_ohlc_dtype.names[1:]:
+        if name not in base_ohlc_dtype.names:
+            del df[name]
+
+    # TODO: it turns out column access on recarrays is actually slower:
+    # https://jakevdp.github.io/PythonDataScienceHandbook/02.09-structured-data-numpy.html#RecordArrays:-Structured-Arrays-with-a-Twist
+    # it might make sense to make these structured arrays?
+    array = df.to_records(index=False)
+    _nan_to_closest_num(array)
+
+    return array
+
+
 def _nan_to_closest_num(array: np.ndarray):
    """Return interpolated values instead of NaN.

--- a/piker/data/cli.py
+++ b/piker/data/cli.py
@ -126,7 +126,7 @@ def ms_stream(
 )
@click.argument('symbols', nargs=-1)
@click.pass_obj
-def storesh(
+def ms_shell(
    config,
    tl,
    host,
@ -137,18 +137,43 @@ def storesh(
    Start an IPython shell ready to query the local marketstore db.

    '''
-    from piker.data.marketstore import tsdb_history_update
+    from piker.data.marketstore import backfill_history_diff
    from piker._daemon import open_piker_runtime

    async def main():
        nonlocal symbols

        async with open_piker_runtime(
-            'storesh',
+            'ms_shell',
            enable_modules=['piker.data._ahab'],
        ):
-            symbol = symbols[0]
-            await tsdb_history_update(symbol)
+            try:
+                await backfill_history_diff()
+            except OSError:
+                # TODO: write magics to query marketstore
+
+                sym = symbols[0]
+                symbol, _, broker = sym.rpartition('.')
+                # (maybe) allocate shm array for this broker/symbol which will
+                # be used for fast near-term history capture and processing.
+                shm, opened = maybe_open_shm_array(
+                    key=sym,
+                    dtype=base_iohlc_dtype,
+                )
+                # load anything found in shm
+                from numpy.lib.recfunctions import structured_to_unstructured
+                mxmn = structured_to_unstructured(
+                    shm.array[['low', 'high']],
+                    # dtype=[('mxmn', '<f8'), ('index', '<i8')],
+                ).flatten()
+
+                from piker.ui._compression import downsample
+                xd, yd = downsample(
+                    y=mxmn,
+                    x=np.arange(len(mxmn)),
+                    bins=4,
+                )
+                await tractor.breakpoint()

    trio.run(main)

@ -159,11 +184,10 @@ def storesh(
@click.argument('name', nargs=1, required=True)
@click.pass_obj
 def ingest(config, name, test_file, tl):
-    '''
-    Ingest real-time broker quotes and ticks to a marketstore instance.
-
-    '''
+    """Ingest real-time broker quotes and ticks to a marketstore instance.
+    """
    # global opts
+    brokermods = config['brokermods']
    loglevel = config['loglevel']
    tractorloglevel = config['tractorloglevel']
    # log = config['log']
--- a/piker/data/feed.py
+++ b/piker/data/feed.py
@ -22,6 +22,7 @@ This module is enabled for ``brokerd`` daemons.
 """
 from __future__ import annotations
 from dataclasses import dataclass, field
+from datetime import datetime
 from contextlib import asynccontextmanager
 from functools import partial
 from types import ModuleType
@ -31,14 +32,11 @@ from typing import (
    Awaitable,
 )

-
-import pendulum
 import trio
 from trio.abc import ReceiveChannel
 from trio_typing import TaskStatus
 import tractor
 from pydantic import BaseModel
-import numpy as np

 from ..brokers import get_brokermod
 from .._cacheables import maybe_open_context
@ -51,6 +49,7 @@ from ._sharedmem import (
    maybe_open_shm_array,
    attach_shm_array,
    ShmArray,
+    _secs_in_day,
 )
 from .ingest import get_ingestormod
 from ._source import (
@ -193,22 +192,6 @@ async def _setup_persistent_brokerd(
        await trio.sleep_forever()


-async def start_backfill(
-    mod: ModuleType,
-    fqsn: str,
-    shm: ShmArray,
-
-    task_status: TaskStatus[trio.CancelScope] = trio.TASK_STATUS_IGNORED,
-
-) -> int:
-
-    return await mod.backfill_bars(
-        fqsn,
-        shm,
-        task_status=task_status,
-    )
-
-
 async def manage_history(
    mod: ModuleType,
    bus: _FeedsBus,
@ -237,102 +220,40 @@ async def manage_history(
        # we expect the sub-actor to write
        readonly=False,
    )
-    # TODO: history validation
-    if not opened:
-        raise RuntimeError(
-            "Persistent shm for sym was already open?!"
-        )

    log.info('Scanning for existing `marketstored`')
-
    is_up = await check_for_service('marketstored')
-
-    # for now only do backfilling if no tsdb can be found
-    do_legacy_backfill = not is_up and opened
-
-    open_history_client = getattr(mod, 'open_history_client', None)
-
-    if is_up and opened and open_history_client:
-
+    if is_up and opened:
        log.info('Found existing `marketstored`')
        from . import marketstore

        async with marketstore.open_storage_client(
            fqsn,
-        ) as storage:
+        ) as (storage, tsdb_arrays):

-            tsdb_arrays = await storage.read_ohlcv(fqsn)
+            # TODO: history validation
+            # assert opened, f'Persistent shm for {symbol} was already open?!'
+            # if not opened:
+            #     raise RuntimeError(
+            #         "Persistent shm for sym was already open?!"
+            #     )

-            if not tsdb_arrays:
-                do_legacy_backfill = True
-
-            else:
+            if tsdb_arrays:
                log.info(f'Loaded tsdb history {tsdb_arrays}')
-
-                fastest = list(tsdb_arrays.values())[0]
-                times = fastest['Epoch']
-                first, last = times[0], times[-1]
-                first_tsdb_dt, last_tsdb_dt = map(
-                    pendulum.from_timestamp, [first, last]
-                )
-
-                # TODO: this should be used verbatim for the pure
-                # shm backfiller approach below.
-
-                def diff_history(
-                    array,
-                    start_dt,
-                    end_dt,
-
-                ) -> np.ndarray:
-
-                    s_diff = (last_tsdb_dt - start_dt).seconds
-
-                    # if we detect a partial frame's worth of data
-                    # that is new, slice out only that history and
-                    # write to shm.
-                    if s_diff > 0:
-                        assert last_tsdb_dt > start_dt
-                        selected = array['time'] > last_tsdb_dt.timestamp()
-                        to_push = array[selected]
-                        log.info(
-                            f'Pushing partial frame {to_push.size} to shm'
-                        )
-                        return to_push
-
-                    else:
-                        return array
-
-                # start history anal and load missing new data via backend.
-                async with open_history_client(fqsn) as hist:
-
-                    # get latest query's worth of history all the way
-                    # back to what is recorded in the tsdb
-                    array, start_dt, end_dt = await hist(end_dt='')
-                    to_push = diff_history(array, start_dt, end_dt)
-                    shm.push(to_push)
-
-                    # let caller unblock and deliver latest history frame
-                    task_status.started(shm)
-                    some_data_ready.set()
-
-                    # pull new history frames until we hit latest
-                    # already in the tsdb
-                    while start_dt > last_tsdb_dt:
-                        array, start_dt, end_dt = await hist(end_dt=start_dt)
-                        to_push = diff_history(array, start_dt, end_dt)
-                        shm.push(to_push, prepend=True)
+                fastest = list(tsdb_arrays[fqsn].values())[0]
+                last_s = fastest['Epoch'][-1]

                # TODO: see if there's faster multi-field reads:
                # https://numpy.org/doc/stable/user/basics.rec.html#accessing-multiple-fields
+
                # re-index  with a `time` and index field
                shm.push(
-                        fastest[-shm._first.value:],
+                    fastest[-3 * _secs_in_day:],

                    # insert the history pre a "days worth" of samples
                    # to leave some real-time buffer space at the end.
                    prepend=True,
-                        # start=shm._len - _secs_in_day,
+                    start=shm._len - _secs_in_day,
                    field_map={
                        'Epoch': 'time',
                        'Open': 'open',
@ -343,23 +264,24 @@ async def manage_history(
                    },
                )

-                    # TODO: write new data to tsdb to be ready to for next
-                    # read.
+                # start history anal and load missing new data via backend.
+                async with mod.open_history_client(fqsn) as hist:

-    if do_legacy_backfill:
-        # do a legacy incremental backfill from the provider.
+                    # get latest query's worth of history
+                    array, next_dt = await hist(end_dt='')
+
+                    last_dt = datetime.fromtimestamp(last_s)
+                    array, next_dt = await hist(end_dt=last_dt)
+
+            some_data_ready.set()
+
+    elif opened:
        log.info('No existing `marketstored` found..')

-        bfqsn = fqsn.replace('.' + mod.name, '')
        # start history backfill task ``backfill_bars()`` is
        # a required backend func this must block until shm is
        # filled with first set of ohlc bars
-        await bus.nursery.start(
-            start_backfill,
-            mod,
-            bfqsn,
-            shm,
-        )
+        _ = await bus.nursery.start(mod.backfill_bars, fqsn, shm)

    # yield back after client connect with filled shm
    task_status.started(shm)
@ -369,18 +291,33 @@ async def manage_history(
    # data that can be used.
    some_data_ready.set()

-    # history retreival loop depending on user interaction and thus
-    # a small RPC-prot for remotely controllinlg what data is loaded
-    # for viewing.
+    # detect sample step size for sampled historical data
+    times = shm.array['time']
+    delay_s = times[-1] - times[times != times[-1]][-1]
+
+    # begin real-time updates of shm and tsb once the feed
+    # goes live.
+    await feed_is_live.wait()
+
+    if opened:
+        sampler.ohlcv_shms.setdefault(delay_s, []).append(shm)
+
+        # start shm incrementing for OHLC sampling at the current
+        # detected sampling period if one dne.
+        if sampler.incrementers.get(delay_s) is None:
+            await bus.start_task(
+                increment_ohlc_buffer,
+                delay_s,
+            )
+
    await trio.sleep_forever()
+    # cs.cancel()


 async def allocate_persistent_feed(
    bus: _FeedsBus,
-
    brokername: str,
    symbol: str,
-
    loglevel: str,
    start_stream: bool = True,

@ -400,7 +337,6 @@ async def allocate_persistent_feed(
    - a real-time streaming task which connec

    '''
-    # load backend module
    try:
        mod = get_brokermod(brokername)
    except ImportError:
@ -425,10 +361,8 @@ async def allocate_persistent_feed(
            loglevel=loglevel,
        )
    )
-    # the broker-specific fully qualified symbol name,
-    # but ensure it is lower-cased for external use.
-    bfqsn = init_msg[symbol]['fqsn'].lower()
-    init_msg[symbol]['fqsn'] = bfqsn
+    # the broker-specific fully qualified symbol name
+    bfqsn = init_msg[symbol]['fqsn']

    # HISTORY, run 2 tasks:
    # - a history loader / maintainer
@ -443,7 +377,7 @@ async def allocate_persistent_feed(
        manage_history,
        mod,
        bus,
-        '.'.join((bfqsn, brokername)),
+        bfqsn,
        some_data_ready,
        feed_is_live,
    )
@ -456,11 +390,9 @@ async def allocate_persistent_feed(

    # true fqsn
    fqsn = '.'.join((bfqsn, brokername))
+
    # add a fqsn entry that includes the ``.<broker>`` suffix
-    # and an entry that includes the broker-specific fqsn (including
-    # any new suffixes or elements as injected by the backend).
    init_msg[fqsn] = msg
-    init_msg[bfqsn] = msg

    # TODO: pretty sure we don't need this? why not just leave 1s as
    # the fastest "sample period" since we'll probably always want that
@ -474,14 +406,13 @@ async def allocate_persistent_feed(
    await some_data_ready.wait()

    # append ``.<broker>`` suffix to each quote symbol
-    acceptable_not_fqsn_with_broker_suffix = symbol + f'.{brokername}'
-
+    bsym = symbol + f'.{brokername}'
    generic_first_quotes = {
-        acceptable_not_fqsn_with_broker_suffix: first_quote,
+        bsym: first_quote,
        fqsn: first_quote,
    }

-    bus.feeds[symbol] = bus.feeds[bfqsn] = (
+    bus.feeds[symbol] = bus.feeds[fqsn] = (
        init_msg,
        generic_first_quotes,
    )
@ -494,22 +425,9 @@ async def allocate_persistent_feed(
    if not start_stream:
        await trio.sleep_forever()

-    # begin real-time updates of shm and tsb once the feed goes live and
-    # the backend will indicate when real-time quotes have begun.
+    # backend will indicate when real-time quotes have begun.
    await feed_is_live.wait()

-    # start shm incrementer task for OHLC style sampling
-    # at the current detected step period.
-    times = shm.array['time']
-    delay_s = times[-1] - times[times != times[-1]][-1]
-
-    sampler.ohlcv_shms.setdefault(delay_s, []).append(shm)
-    if sampler.incrementers.get(delay_s) is None:
-        await bus.start_task(
-            increment_ohlc_buffer,
-            delay_s,
-        )
-
    sum_tick_vlm: bool = init_msg.get(
        'shm_write_opts', {}
    ).get('sum_tick_vlm', True)
@ -532,7 +450,7 @@ async def open_feed_bus(

    ctx: tractor.Context,
    brokername: str,
-    symbol: str,  # normally expected to the broker-specific fqsn
+    symbol: str,
    loglevel: str,
    tick_throttle:  Optional[float] = None,
    start_stream: bool = True,
@ -554,9 +472,7 @@ async def open_feed_bus(
    # TODO: check for any stale shm entries for this symbol
    # (after we also group them in a nice `/dev/shm/piker/` subdir).
    # ensure we are who we think we are
-    servicename = tractor.current_actor().name
-    assert 'brokerd' in servicename
-    assert brokername in servicename
+    assert 'brokerd' in tractor.current_actor().name

    bus = get_feed_bus(brokername)

@ -566,7 +482,7 @@ async def open_feed_bus(
    entry = bus.feeds.get(symbol)
    if entry is None:
        # allocate a new actor-local stream bus which
-        # will persist for this `brokerd`'s service lifetime.
+        # will persist for this `brokerd`.
        async with bus.task_lock:
            await bus.nursery.start(
                partial(
@ -590,12 +506,12 @@ async def open_feed_bus(
    init_msg, first_quotes = bus.feeds[symbol]

    msg = init_msg[symbol]
-    bfqsn = msg['fqsn'].lower()
+    bfqsn = msg['fqsn']

    # true fqsn
    fqsn = '.'.join([bfqsn, brokername])
    assert fqsn in first_quotes
-    assert bus.feeds[bfqsn]
+    assert bus.feeds[fqsn]

    # broker-ambiguous symbol (provided on cli - eg. mnq.globex.ib)
    bsym = symbol + f'.{brokername}'
@ -909,10 +825,7 @@ async def maybe_open_feed(

    **kwargs,

-) -> (
-    Feed,
-    ReceiveChannel[dict[str, Any]],
-):
+) -> (Feed, ReceiveChannel[dict[str, Any]]):
    '''
    Maybe open a data to a ``brokerd`` daemon only if there is no
    local one for the broker-symbol pair, if one is cached use it wrapped
@ -933,7 +846,6 @@ async def maybe_open_feed(
            'start_stream': kwargs.get('start_stream', True),
        },
        key=fqsn,
-
    ) as (cache_hit, feed):

        if cache_hit:
--- a/piker/data/marketstore.py
+++ b/piker/data/marketstore.py
@ -29,13 +29,14 @@ from typing import (
    Any,
    Optional,
    Union,
+    # Callable,
+    # TYPE_CHECKING,
 )
 import time
 from math import isnan

 from bidict import bidict
 import msgpack
-import pyqtgraph as pg
 import numpy as np
 import pandas as pd
 import tractor
@ -48,8 +49,15 @@ from anyio_marketstore import (
 import purerpc

 from .feed import maybe_open_feed
+from ._source import (
+    mk_fqsn,
+    # Symbol,
+)
 from ..log import get_logger, get_console_log

+# if TYPE_CHECKING:
+#     from ._sharedmem import ShmArray
+

 log = get_logger(__name__)

@ -227,16 +235,6 @@ class Storage:
        # series' cache from tsdb reads
        self._arrays: dict[str, np.ndarray] = {}

-    async def list_keys(self) -> list[str]:
-        return await self.client.list_symbols()
-
-    async def search_keys(self, pattern: str) -> list[str]:
-        '''
-        Search for time series key in the storage backend.
-
-        '''
-        ...
-
    async def write_ticks(self, ticks: list) -> None:
        ...

@ -258,29 +256,14 @@ class Storage:
        if fqsn not in syms:
            return {}

-        tfstr = tf_in_1s[1]
-
-        params = Params(
-            symbols=fqsn,
-            timeframe=tfstr,
-            attrgroup='OHLCV',
-            # limit_from_start=True,
-
-            # TODO: figure the max limit here given the
-            # ``purepc`` msg size limit of purerpc: 33554432
-            limit=int(800e3),
-        )
-
        if timeframe is None:
            log.info(f'starting {fqsn} tsdb granularity scan..')
            # loop through and try to find highest granularity
            for tfstr in tf_in_1s.values():
                try:
                    log.info(f'querying for {tfstr}@{fqsn}')
-                    params.set('timeframe', tfstr)
-                    result = await client.query(params)
+                    result = await client.query(Params(fqsn, tfstr, 'OHLCV',))
                    break
-
                except purerpc.grpclib.exceptions.UnknownError:
                    # XXX: this is already logged by the container and
                    # thus shows up through `marketstored` logs relay.
@ -290,11 +273,9 @@ class Storage:
                return {}

        else:
-            result = await client.query(params)
+            tfstr = tf_in_1s[timeframe]
+            result = await client.query(Params(fqsn, tfstr, 'OHLCV',))

-        # TODO: it turns out column access on recarrays is actually slower:
-        # https://jakevdp.github.io/PythonDataScienceHandbook/02.09-structured-data-numpy.html#RecordArrays:-Structured-Arrays-with-a-Twist
-        # it might make sense to make these structured arrays?
        # Fill out a `numpy` array-results map
        arrays = {}
        for fqsn, data_set in result.by_symbols().items():
@ -302,22 +283,7 @@ class Storage:
                tf_in_1s.inverse[data_set.timeframe]
            ] = data_set.array

-        return arrays[fqsn][timeframe] if timeframe else arrays[fqsn]
-
-    async def delete_ts(
-        self,
-        key: str,
-        timeframe: Optional[Union[int, str]] = None,
-
-    ) -> bool:
-
-        client = self.client
-        syms = await client.list_symbols()
-        print(syms)
-        # if key not in syms:
-        #     raise KeyError(f'`{fqsn}` table key not found?')
-
-        return await client.destroy(tbk=key)
+        return arrays[fqsn][timeframe] if timeframe else arrays


@acm
@ -330,16 +296,19 @@ async def open_storage_client(
    Load a series by key and deliver in ``numpy`` struct array format.

    '''
-    async with (
-        # eventually a storage backend endpoint
-        get_client() as client,
-    ):
-        # slap on our wrapper api
-        yield Storage(client)
+    async with get_client() as client:
+
+        storage_client = Storage(client)
+        arrays = await storage_client.read_ohlcv(
+            fqsn,
+            period,
+        )
+
+        yield storage_client, arrays


-async def tsdb_history_update(
-    fqsn: str,
+async def backfill_history_diff(
+    # symbol: Symbol

 ) -> list[str]:

@ -369,64 +338,73 @@ async def tsdb_history_update(
    #   * the original data feed arch blurb:
    #     - https://github.com/pikers/piker/issues/98
    #
-    profiler = pg.debug.Profiler(
-        disabled=False,  # not pg_profile_enabled(),
-        delayed=False,
-    )
+
+    broker = 'ib'
+    symbol = 'mnq.globex'
+
+    # broker = 'binance'
+    # symbol = 'btcusdt'
+
+    fqsn = mk_fqsn(broker, symbol)

    async with (
-        open_storage_client(fqsn) as storage,
-
+        get_client() as client,
        maybe_open_feed(
-            [fqsn],
+            broker,
+            [symbol],
+            loglevel='info',
+            # backpressure=False,
            start_stream=False,

        ) as (feed, stream),
    ):
-        profiler(f'opened feed for {fqsn}')
-
-        symbol = feed.symbols.get(fqsn)
-        if symbol:
-            fqsn = symbol.front_fqsn()
-
-        syms = await storage.client.list_symbols()
-        log.info(f'Existing tsdb symbol set:\n{pformat(syms)}')
-        profiler(f'listed symbols {syms}')
+        syms = await client.list_symbols()
+        log.info(f'Existing symbol set:\n{pformat(syms)}')

        # diff db history with shm and only write the missing portions
        ohlcv = feed.shm.array

-        # TODO: use pg profiler
-        tsdb_arrays = await storage.read_ohlcv(fqsn)
+        key = (fqsn, '1Sec', 'OHLCV')
+        tbk = mk_tbk(key)

-        to_append = feed.shm.array
-        to_prepend = None
+        # diff vs. existing array and append new history
+        # TODO:

-        # hist diffing
-        if tsdb_arrays:
-            onesec = tsdb_arrays[1]
-            to_append = ohlcv[ohlcv['time'] > onesec['Epoch'][-1]]
-            to_prepend = ohlcv[ohlcv['time'] < onesec['Epoch'][0]]
+        # TODO: should be no error?
+        # assert not resp.responses

-        profiler('Finished db arrays diffs')
+        start = time.time()

-        for array in [to_append, to_prepend]:
-            if array is None:
-                continue
+        qr = await client.query(
+            # Params(fqsn, '1Sec`', 'OHLCV',)
+            Params(*key),
+        )
+        # # Dig out `numpy` results map
+        arrays: dict[tuple[str, int], np.ndarray] = {}
+        for name, data_set in qr.by_symbols().items():
+            in_secs = tf_in_1s.inverse[data_set.timeframe]
+            arrays[(name, in_secs)] = data_set.array
+
+        s1 = arrays[(fqsn, 1)]
+        to_append = ohlcv[ohlcv['time'] > s1['Epoch'][-1]]
+
+        end_diff = time.time()
+        diff_ms = round((end_diff - start) * 1e3, ndigits=2)

        log.info(
-                f'Writing datums {array.size} -> to tsdb from shm\n'
+            f'Appending {to_append.size} datums to tsdb from shm\n'
+            f'Total diff time: {diff_ms} ms'
        )

        # build mkts schema compat array for writing
        mkts_dt = np.dtype(_ohlcv_dt)
        mkts_array = np.zeros(
-                len(array),
+            len(to_append),
            dtype=mkts_dt,
        )
        # copy from shm array (yes it's this easy):
        # https://numpy.org/doc/stable/user/basics.rec.html#assignment-from-other-structured-arrays
-            mkts_array[:] = array[[
+        mkts_array[:] = to_append[[
            'time',
            'open',
            'high',
@ -436,28 +414,32 @@ async def tsdb_history_update(
        ]]

        # write to db
-            resp = await storage.client.write(
+        resp = await client.write(
            mkts_array,
-                tbk=f'{fqsn}/1Sec/OHLCV',
-
+            tbk=tbk,
            # NOTE: will will append duplicates
            # for the same timestamp-index.
-                # TODO: pre deduplicate?
            isvariablelength=True,
        )
-
+        end_write = time.time()
+        diff_ms = round((end_write - end_diff) * 1e3, ndigits=2)
        log.info(
            f'Wrote {to_append.size} datums to tsdb\n'
+            f'Total write time: {diff_ms} ms'
        )
-            profiler('Finished db writes')
-
        for resp in resp.responses:
            err = resp.error
            if err:
                raise MarketStoreError(err)

-        from tractor.trionics import ipython_embed
-        await ipython_embed()
+        # TODO: backfiller loop
+        from piker.ui._compression import downsample
+        x, y = downsample(
+            s1['Epoch'],
+            s1['Close'],
+            bins=10,
+        )
+        await tractor.breakpoint()


 async def ingest_quote_stream(
--- a/scripts/ib_data_reset.py
+++ b/scripts/ib_data_reset.py
@ -54,7 +54,7 @@ for name in win_names:
        # disconnect?
        for key_combo, timeout in [
            # only required if we need a connection reset.
-            # ('ctrl+alt+r', 12),
+            ('ctrl+alt+r', 12),
            # data feed reset.
            ('ctrl+alt+f', 6)
        ]: