Finally write a general purpose null-gap detector!
Using a bunch of fancy `numpy` vec ops (and ideally eventually
extending the same to `polars`), this is a first draft of
`get_null_segs()`, a detector for segments where the chosen
`col: str` field is zero-valued. It filters the input frame to all
such segments and returns the corresponding useful slice-indexes
(see the sketch below):
- gap absolute (in shm buffer terms) index-endpoints as
  `absi_zsegs`, for slicing to each null-segment in the src frame.
- ALL abs indices of rows with zeroed `col` values as `absi_zeros`.
- the full set of the input frame's row-entries (view) which are
  null-valued for the chosen `col` as `zero_t`.
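
For reference, a minimal `numpy`-only sketch of the same vectorized
idea (the `null_segs_sketch()` name and exact return layout here are
illustrative assumptions, not the in-repo `tsp.get_null_segs()` impl):

```python
import numpy as np

def null_segs_sketch(
    frame: np.ndarray,  # structured array with 'index' & `col` fields
    col: str,
) -> tuple[list[list[int]], np.ndarray, np.ndarray] | None:
    '''
    Detect contiguous runs of zero-valued `col` entries and return
    `(absi_zsegs, absi_zeros, zero_t)` style output.

    '''
    zmask: np.ndarray = frame[col] == 0
    if not zmask.any():
        return None

    # ALL absolute (shm-buffer) indices of zeroed rows
    absi_zeros: np.ndarray = frame['index'][zmask]
    # the frame's null-valued row entries
    zero_t: np.ndarray = frame[zmask]

    # any break (diff > 1) in the zeroed-index sequence marks
    # a boundary between two distinct null-segments.
    breaks: np.ndarray = np.where(np.diff(absi_zeros) > 1)[0]
    starts = np.concatenate(([absi_zeros[0]], absi_zeros[breaks + 1]))
    ends = np.concatenate((absi_zeros[breaks], [absi_zeros[-1]]))
    absi_zsegs: list[list[int]] = [
        [int(s), int(e)] for s, e in zip(starts, ends)
    ]
    return absi_zsegs, absi_zeros, zero_t
```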

Use this new null-segment detector in the
`.data.history.start_backfill()` task to attempt to fill null gaps
that might be extant from some prior backfill attempt. Since
`get_null_segs()` now delivers a sequence of slices, one per gap, we
no longer need the `while gap_indices:` loop; instead, move the
re-check to the end of the func and warn-log (for now) if all gaps
aren't eventually filled.
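
A sketch of that end-of-func re-check as described (hedged; the actual
call-sites are in the diff below, which currently `tractor.pause()`s
instead of warning):

```python
# after the backfill loop: re-scan and warn (for now) on leftovers
if (null_segs := get_null_segs(shm.array, period=timeframe)):
    log.warning(f'Un-filled null-segments remain: {null_segs[0]}')
```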

TODO:
-[ ] do the null-seg detection and filling concurrently with
  most-recent-frame backfilling.
-[ ] offer the same detection in `.storage.cli` cmds for manual tsp
  analysis.
-[ ] make the graphics layer actually update correctly when null-segs
  are filled (currently still broken somehow in the `Viz` caching
  layer?)

CHERRY INTO #486
goodboy committed Dec 13, 2023
1 parent c4853a3 commit c129f5b
Showing 2 changed files with 279 additions and 156 deletions.
piker/data/history.py (257 changes: 143 additions & 114 deletions)
@@ -56,7 +56,13 @@
 from ._sampling import (
     open_sample_stream,
 )
-from . import tsp
+from .tsp import (
+    dedupe,
+    get_null_segs,
+    sort_diff,
+    Frame,
+    Seq,
+)
 from ..brokers._util import (
     DataUnavailable,
 )
@@ -158,6 +164,100 @@ async def shm_push_in_between(
     # await tractor.pause()


+async def maybe_fill_null_segments(
+    shm: ShmArray,
+    timeframe: float,
+    get_hist: Callable,
+    sampler_stream: tractor.MsgStream,
+    mkt: MktPair,
+
+) -> list[Frame]:
+
+    frame: Frame = shm.array
+
+    null_segs: tuple | None = get_null_segs(
+        frame,
+        period=timeframe,
+    )
+    if null_segs:
+        absi_pairs_zsegs: list[list[float, float]]
+        izeros: Seq
+        zero_t: Frame
+        (
+            absi_pairs_zsegs,
+            izeros,
+            zero_t,
+        ) = null_segs
+
+        absi_first: int = frame[0]['index']
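+        # NOTE: the `absi_*` pairs are absolute shm-buffer indices;
+        # subtracting the frame's first abs index below gives the
+        # frame-relative offsets used to read each gap's edge rows.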
+        for absi_start, absi_end in absi_pairs_zsegs:
+            # await tractor.pause()
+            fi_start = absi_start - absi_first
+            fi_end = absi_end - absi_first
+            start_row: Seq = frame[fi_start]
+            end_row: Seq = frame[fi_end]
+
+            start_t: float = start_row['time']
+            end_t: float = end_row['time']
+
+            start_dt = from_timestamp(start_t)
+            end_dt = from_timestamp(end_t)
+
+            # if we get a badly ordered timestamp
+            # pair, immediately stop backfilling.
+            if end_dt < start_dt:
+                break
+
+            (
+                array,
+                next_start_dt,
+                next_end_dt,
+            ) = await get_hist(
+                timeframe,
+                start_dt=start_dt,
+                end_dt=end_dt,
+            )
+
+            # XXX TODO: pretty sure if i plot tsla, btcusdt.binance
+            # and mnq.cme.ib this causes a Qt crash XXDDD
+
+            # make sure we don't overrun the buffer start
+            len_to_push: int = min(absi_end, array.size)
+            to_push: np.ndarray = array[-len_to_push:]
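+            # (the `min()` guard above keeps the prepend from running
+            # past the buffer's 0th slot, and the tail-slice keeps
+            # only the newest rows when the provider over-delivers)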

+            await shm_push_in_between(
+                shm,
+                to_push,
+                prepend_index=absi_end,
+                update_start_on_prepend=False,
+            )
+
+            # TODO: UI side needs IPC event to update..
+            # - make sure the UI actually always handles
+            #   this update!
+            # - remember that in the display side, only refresh this
+            #   if the respective history is actually "in view".
+            # loop
+            await sampler_stream.send({
+                'broadcast_all': {
+                    'backfilling': (mkt.fqme, timeframe),
+                },
+            })

+        # RECHECK for more null-gaps
+        frame: Frame = shm.array
+        null_segs: tuple | None = get_null_segs(
+            frame,
+            period=timeframe,
+        )
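+        # the trailing entry of the `null_segs` tuple is the
+        # `zero_t` row-view; if it's still non-empty some gaps
+        # remain un-filled, so drop into the debugger to inspect.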
+        if (
+            null_segs
+            and
+            len(null_segs[-1])
+        ):
+            await tractor.pause()


 async def start_backfill(
     get_hist,
     mod: ModuleType,
@@ -224,16 +324,20 @@ async def start_backfill(
     # per time stamp.
     # starts: Counter[datetime] = Counter()

-    # conduct "backward history gap filling" where we push to
-    # the shm buffer until we have history back until the
-    # latest entry loaded from the tsdb's table B)
+    # STAGE NOTE: "backward history gap filling":
+    # - we push to the shm buffer until we have history back
+    #   until the latest entry loaded from the tsdb's table B)
+    # - after this loop continue to check for other gaps in the
+    #   (tsdb) history and (at least report) maybe fill them
+    #   from new frame queries to the backend?
     last_start_dt: datetime = backfill_from_dt
     next_prepend_index: int = backfill_from_shm_index

     while last_start_dt > backfill_until_dt:
-
-        log.debug(
-            f'Requesting {timeframe}s frame ending in {last_start_dt}'
+        log.info(
+            f'Requesting {timeframe}s frame:\n'
+            f'backfill_until_dt: {backfill_until_dt}\n'
+            f'last_start_dt: {last_start_dt}\n'
         )

         try:
@@ -261,45 +365,29 @@
             await tractor.pause()
             return

-        # TODO: drop this? see todo above..
-        # if (
-        #     next_start_dt in starts
-        #     and starts[next_start_dt] <= 6
-        # ):
-        #     start_dt = min(starts)
-        #     log.warning(
-        #         f"{mkt.fqme}: skipping duplicate frame @ {next_start_dt}"
-        #     )
-        #     starts[start_dt] += 1
-        #     await tractor.pause()
-        #     continue
-
-        # elif starts[next_start_dt] > 6:
-        #     log.warning(
-        #         f'NO-MORE-DATA: backend {mod.name} before {next_start_dt}?'
-        #     )
-        #     return
-
-        # # only update new start point if not-yet-seen
-        # starts[next_start_dt] += 1
-
-        assert array['time'][0] == next_start_dt.timestamp()
+        assert (
+            array['time'][0]
+            ==
+            next_start_dt.timestamp()
+        )

         diff = last_start_dt - next_start_dt
         frame_time_diff_s = diff.seconds

         # frame's worth of sample-period-steps, in seconds
-        frame_size_s = len(array) * timeframe
-        expected_frame_size_s = frame_size_s + timeframe
+        frame_size_s: float = len(array) * timeframe
+        expected_frame_size_s: float = frame_size_s + timeframe
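+        # e.g. with a 60s timeframe and a 1000-row result frame,
+        # frame_size_s == 60_000.0, so any frame-edge time-diff
+        # greater than 60_060.0s implies missing samples -> a gap.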
         if frame_time_diff_s > expected_frame_size_s:

             # XXX: query result includes a start point prior to our
             # expected "frame size" and thus is likely some kind of
             # history gap (eg. market closed period, outage, etc.)
             # so just report it to console for now.
             log.warning(
-                f'History frame ending @ {last_start_dt} appears to have a gap:\n'
-                f'{diff} ~= {frame_time_diff_s} seconds'
+                'GAP DETECTED:\n'
+                f'last_start_dt: {last_start_dt}\n'
+                f'diff: {diff}\n'
+                f'frame_time_diff_s: {frame_time_diff_s}\n'
             )

         to_push = diff_history(
@@ -415,74 +503,32 @@ async def start_backfill(
             gaps,
             deduped,
             diff,
-        ) = tsp.dedupe(df)
+        ) = dedupe(df)
         if diff:
-            tsp.sort_diff(df)
+            sort_diff(df)

     else:
         # finally filled gap
         log.info(
             f'Finished filling gap to tsdb start @ {backfill_until_dt}!'
         )
-        # conduct tsdb timestamp gap detection and backfill any
-        # seemingly missing sequence segments..
-        # TODO: ideally these never exist but somehow it seems
-        # sometimes we're writing zero-ed segments on certain
-        # (teardown) cases?
-        from .tsp import detect_null_time_gap
-
-        gap_indices: tuple | None = detect_null_time_gap(shm)
-        while gap_indices:
-            (
-                istart,
-                start,
-                end,
-                iend,
-            ) = gap_indices
-
-            start_dt = from_timestamp(start)
-            end_dt = from_timestamp(end)
-
-            # if we get a badly ordered timestamp
-            # pair, immediately stop backfilling.
-            if end_dt < start_dt:
-                break
-
-            (
-                array,
-                next_start_dt,
-                next_end_dt,
-            ) = await get_hist(
-                timeframe,
-                start_dt=start_dt,
-                end_dt=end_dt,
-            )
-
-            # XXX TODO: pretty sure if i plot tsla, btcusdt.binance
-            # and mnq.cme.ib this causes a Qt crash XXDDD
-
-            # make sure we don't overrun the buffer start
-            len_to_push: int = min(iend, array.size)
-            to_push: np.ndarray = array[-len_to_push:]
-            await shm_push_in_between(
-                shm,
-                to_push,
-                prepend_index=iend,
-                update_start_on_prepend=False,
-            )
-
-            # TODO: UI side needs IPC event to update..
-            # - make sure the UI actually always handles
-            #   this update!
-            # - remember that in the display side, only refresh this
-            #   if the respective history is actually "in view".
-            # loop
-            await sampler_stream.send({
-                'broadcast_all': {
-                    'backfilling': (mkt.fqme, timeframe),
-                },
-            })
-            gap_indices: tuple | None = detect_null_time_gap(shm)
+
+    # NOTE: conduct tsdb timestamp gap detection and backfill any
+    # seemingly missing (null-time) segments..
+
+    # TODO: ideally these can never exist!
+    # -[ ] somehow it seems sometimes we're writing zero-ed
+    #      segments to tsdbs during teardown?
+    # -[ ] can we ensure that the backfiller tasks do this
+    #      work PREVENTIVELY instead?
+    # -[ ] fill in non-zero epoch time values ALWAYS!
+    await maybe_fill_null_segments(
+        shm=shm,
+        timeframe=timeframe,
+        get_hist=get_hist,
+        sampler_stream=sampler_stream,
+        mkt=mkt,
+    )

     # XXX: extremely important, there can be no checkpoints
     # in the block above to avoid entering new ``frames``
@@ -679,28 +725,11 @@ async def tsdb_backfill(
         # there's no backfilling possible.
         except DataUnavailable:
             task_status.started()
-            await tractor.pause()
-            return
-
-            # TODO: fill in non-zero epoch time values ALWAYS!
-            # hist_shm._array['time'] = np.arange(
-            #     start=
-
-            # NOTE: removed for now since it'll always break
-            # on the first 60s of the venue open..
-            # times: np.ndarray = array['time']
-            # # sample period step size in seconds
-            # step_size_s = (
-            #     from_timestamp(times[-1])
-            #     - from_timestamp(times[-2])
-            # ).seconds
-
-            # if step_size_s not in (1, 60):
-            #     log.error(f'Last 2 sample period is off!? -> {step_size_s}')
-            #     step_size_s = (
-            #         from_timestamp(times[-2])
-            #         - from_timestamp(times[-3])
-            #     ).seconds
+
+            if timeframe > 1:
+                await tractor.pause()
+
+            return

         # NOTE: on the first history, most recent history
         # frame we PREPEND from the current shm ._last index