WIP
This commit is contained in:
@@ -34,13 +34,13 @@ pub async fn dyn_events_stream(
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
) -> Result<DynEventsStream, Error> {
|
||||
trace!("dyn_events_stream {}", evq.summary_short());
|
||||
use query::api4::events::EventsSubQuerySettings;
|
||||
let subq = make_sub_query(
|
||||
ch_conf,
|
||||
evq.range().clone(),
|
||||
evq.one_before_range(),
|
||||
evq.transform().clone(),
|
||||
evq.test_do_wasm(),
|
||||
evq,
|
||||
EventsSubQuerySettings::from(evq),
|
||||
evq.log_level().into(),
|
||||
ctx,
|
||||
);
|
||||
|
||||
@@ -36,6 +36,7 @@ use query::transform::TransformQuery;
|
||||
use serde::de::DeserializeOwned;
|
||||
use std::fmt;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
use tokio::io::AsyncWriteExt;
|
||||
use tokio::net::TcpStream;
|
||||
|
||||
@@ -45,11 +46,12 @@ pub trait OpenBoxedBytesStreams {
|
||||
fn open(
|
||||
&self,
|
||||
subq: EventsSubQuery,
|
||||
// TODO take by Arc
|
||||
ctx: ReqCtx,
|
||||
) -> Pin<Box<dyn Future<Output = Result<Vec<BoxedBytesStream>, Error>> + Send>>;
|
||||
}
|
||||
|
||||
pub type OpenBoxedBytesStreamsBox = Pin<Box<dyn OpenBoxedBytesStreams + Send>>;
|
||||
pub type OpenBoxedBytesStreamsBox = Pin<Arc<dyn OpenBoxedBytesStreams + Send + Sync>>;
|
||||
|
||||
pub fn make_node_command_frame(query: EventsSubQuery) -> Result<EventQueryJsonStringFrame, Error> {
|
||||
let obj = Frame1Parts::new(query);
|
||||
@@ -202,7 +204,6 @@ pub fn make_sub_query<SUB>(
|
||||
range: SeriesRange,
|
||||
one_before_range: bool,
|
||||
transform: TransformQuery,
|
||||
test_do_wasm: Option<&str>,
|
||||
sub: SUB,
|
||||
log_level: String,
|
||||
ctx: &ReqCtx,
|
||||
@@ -210,8 +211,8 @@ pub fn make_sub_query<SUB>(
|
||||
where
|
||||
SUB: Into<EventsSubQuerySettings>,
|
||||
{
|
||||
let mut select = EventsSubQuerySelect::new(ch_conf, range, one_before_range, transform);
|
||||
if let Some(wasm1) = test_do_wasm {
|
||||
let mut select = EventsSubQuerySelect::new(ch_conf, range, one_before_range, transform.clone());
|
||||
if let Some(wasm1) = transform.do_wasm() {
|
||||
select.set_wasm1(wasm1.into());
|
||||
}
|
||||
let settings = sub.into();
|
||||
|
||||
@@ -45,7 +45,7 @@ fn merge_mergeable_00() -> Result<(), Error> {
|
||||
let fut = async {
|
||||
let inp0 = inmem_test_events_d0_i32_00();
|
||||
let inp1 = inmem_test_events_d0_i32_01();
|
||||
let _merger = items_2::merger::Merger::new(vec![inp0, inp1], 4);
|
||||
let _merger = items_2::merger::Merger::new(vec![inp0, inp1], Some(4));
|
||||
Ok(())
|
||||
};
|
||||
runfut(fut)
|
||||
|
||||
@@ -21,6 +21,7 @@ use netpod::Shape;
|
||||
use query::api4::events::EventsSubQuery;
|
||||
use query::api4::events::PlainEventsQuery;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
|
||||
#[test]
|
||||
fn merged_events_cbor() {
|
||||
@@ -46,7 +47,7 @@ async fn merged_events_inner() -> Result<(), Error> {
|
||||
));
|
||||
let evq = PlainEventsQuery::new(channel, range);
|
||||
let open_bytes = StreamOpener::new();
|
||||
let open_bytes = Box::pin(open_bytes);
|
||||
let open_bytes = Arc::pin(open_bytes);
|
||||
let stream = plain_events_cbor_stream(&evq, ch_conf.clone().into(), &ctx, open_bytes)
|
||||
.await
|
||||
.unwrap();
|
||||
|
||||
@@ -1,8 +1,10 @@
|
||||
mod basic;
|
||||
mod cached;
|
||||
pub mod cached;
|
||||
mod fromlayers;
|
||||
mod gapfill;
|
||||
mod grid;
|
||||
|
||||
pub(super) use basic::TimeBinnedStream;
|
||||
pub(super) use fromlayers::TimeBinnedFromLayers;
|
||||
|
||||
pub use cached::reader::CacheReadProvider;
|
||||
|
||||
@@ -252,6 +252,7 @@ where
|
||||
trace2!("================= POLL");
|
||||
loop {
|
||||
break if self.complete {
|
||||
error!("TimeBinnedStream poll on complete");
|
||||
panic!("TimeBinnedStream poll on complete")
|
||||
} else if self.done {
|
||||
self.complete = true;
|
||||
|
||||
@@ -8,6 +8,7 @@ use netpod::DtMs;
|
||||
use netpod::TsNano;
|
||||
use std::future::Future;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
use std::task::Context;
|
||||
use std::task::Poll;
|
||||
|
||||
@@ -23,16 +24,18 @@ impl Future for Reading {
|
||||
}
|
||||
}
|
||||
|
||||
pub trait CacheReadProvider: Send {
|
||||
pub trait CacheReadProvider: Send + Sync {
|
||||
fn read(&self) -> Reading;
|
||||
}
|
||||
|
||||
#[derive(Debug, ThisError)]
|
||||
#[cstm(name = "BinCachedReader")]
|
||||
pub enum Error {}
|
||||
pub enum Error {
|
||||
TodoImpl,
|
||||
}
|
||||
|
||||
pub struct CachedReader {
|
||||
cache_read_provider: Box<dyn CacheReadProvider>,
|
||||
cache_read_provider: Arc<dyn CacheReadProvider>,
|
||||
}
|
||||
|
||||
impl CachedReader {
|
||||
@@ -40,7 +43,7 @@ impl CachedReader {
|
||||
series: u64,
|
||||
bin_len: DtMs,
|
||||
range: BinnedRange<TsNano>,
|
||||
cache_read_provider: Box<dyn CacheReadProvider>,
|
||||
cache_read_provider: Arc<dyn CacheReadProvider>,
|
||||
) -> Result<Self, Error> {
|
||||
let ret = Self { cache_read_provider };
|
||||
Ok(ret)
|
||||
@@ -52,6 +55,7 @@ impl Stream for CachedReader {
|
||||
|
||||
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context) -> Poll<Option<Self::Item>> {
|
||||
use Poll::*;
|
||||
// Ready(Some(Err(Error::TodoImpl)))
|
||||
Ready(None)
|
||||
}
|
||||
}
|
||||
|
||||
@@ -1,4 +1,5 @@
|
||||
use super::cached::reader::CacheReadProvider;
|
||||
use crate::tcprawclient::OpenBoxedBytesStreamsBox;
|
||||
use crate::timebin::grid::find_next_finer_bin_len;
|
||||
use err::thiserror;
|
||||
use err::ThisError;
|
||||
@@ -14,9 +15,14 @@ use items_2::binsdim0::BinsDim0;
|
||||
use netpod::log::*;
|
||||
use netpod::BinnedRange;
|
||||
use netpod::BinnedRangeEnum;
|
||||
use netpod::ChannelTypeConfigGen;
|
||||
use netpod::DtMs;
|
||||
use netpod::ReqCtx;
|
||||
use netpod::TsNano;
|
||||
use query::api4::events::EventsSubQuerySettings;
|
||||
use query::transform::TransformQuery;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
use std::task::Context;
|
||||
use std::task::Poll;
|
||||
|
||||
@@ -30,6 +36,12 @@ pub enum Error {
|
||||
type BoxedInput = Pin<Box<dyn Stream<Item = Sitemty<BinsDim0<f32>>> + Send>>;
|
||||
|
||||
pub struct TimeBinnedFromLayers {
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
inp: BoxedInput,
|
||||
}
|
||||
|
||||
@@ -39,11 +51,17 @@ impl TimeBinnedFromLayers {
|
||||
}
|
||||
|
||||
pub fn new(
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
series: u64,
|
||||
range: BinnedRange<TsNano>,
|
||||
do_time_weight: bool,
|
||||
bin_len_layers: Vec<DtMs>,
|
||||
cache_read_provider: Box<dyn CacheReadProvider>,
|
||||
cache_read_provider: Arc<dyn CacheReadProvider + Send>,
|
||||
) -> Result<Self, Error> {
|
||||
info!(
|
||||
"{}::new {:?} {:?} {:?}",
|
||||
@@ -55,8 +73,28 @@ impl TimeBinnedFromLayers {
|
||||
let bin_len = DtMs::from_ms_u64(range.bin_len.ms());
|
||||
if bin_len_layers.contains(&bin_len) {
|
||||
info!("{}::new bin_len in layers", Self::type_name());
|
||||
let inp = super::gapfill::GapFill::new(series, range, do_time_weight, bin_len_layers, cache_read_provider)?;
|
||||
let ret = Self { inp: Box::pin(inp) };
|
||||
let inp = super::gapfill::GapFill::new(
|
||||
ch_conf.clone(),
|
||||
transform_query.clone(),
|
||||
sub.clone(),
|
||||
log_level.clone(),
|
||||
ctx.clone(),
|
||||
open_bytes.clone(),
|
||||
series,
|
||||
range,
|
||||
do_time_weight,
|
||||
bin_len_layers,
|
||||
cache_read_provider,
|
||||
)?;
|
||||
let ret = Self {
|
||||
ch_conf,
|
||||
transform_query,
|
||||
sub,
|
||||
log_level,
|
||||
ctx,
|
||||
open_bytes,
|
||||
inp: Box::pin(inp),
|
||||
};
|
||||
Ok(ret)
|
||||
} else {
|
||||
match find_next_finer_bin_len(bin_len, &bin_len_layers) {
|
||||
@@ -64,8 +102,14 @@ impl TimeBinnedFromLayers {
|
||||
// TODO
|
||||
// produce from binned sub-stream with additional binner.
|
||||
let range = BinnedRange::from_nano_range(range.to_nano_range(), finer);
|
||||
info!("{}::new next finer {:?} {:?}", Self::type_name(), finer, range);
|
||||
warn!("{}::new next finer {:?} {:?}", Self::type_name(), finer, range);
|
||||
let inp = super::gapfill::GapFill::new(
|
||||
ch_conf.clone(),
|
||||
transform_query.clone(),
|
||||
sub.clone(),
|
||||
log_level.clone(),
|
||||
ctx.clone(),
|
||||
open_bytes.clone(),
|
||||
series,
|
||||
range.clone(),
|
||||
do_time_weight,
|
||||
@@ -77,11 +121,19 @@ impl TimeBinnedFromLayers {
|
||||
BinnedRangeEnum::Time(range),
|
||||
do_time_weight,
|
||||
);
|
||||
let ret = Self { inp: Box::pin(inp) };
|
||||
let ret = Self {
|
||||
ch_conf,
|
||||
transform_query,
|
||||
sub,
|
||||
log_level,
|
||||
ctx,
|
||||
open_bytes,
|
||||
inp: Box::pin(inp),
|
||||
};
|
||||
Ok(ret)
|
||||
}
|
||||
None => {
|
||||
info!("{}::new NO next finer", Self::type_name());
|
||||
warn!("{}::new NO next finer", Self::type_name());
|
||||
// TODO
|
||||
// produce from events
|
||||
todo!()
|
||||
@@ -94,7 +146,12 @@ impl TimeBinnedFromLayers {
|
||||
impl Stream for TimeBinnedFromLayers {
|
||||
type Item = Sitemty<BinsDim0<f32>>;
|
||||
|
||||
fn poll_next(self: Pin<&mut Self>, cx: &mut Context) -> Poll<Option<Self::Item>> {
|
||||
todo!()
|
||||
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context) -> Poll<Option<Self::Item>> {
|
||||
use Poll::*;
|
||||
match self.inp.poll_next_unpin(cx) {
|
||||
Ready(Some(x)) => Ready(Some(x)),
|
||||
Ready(None) => Ready(None),
|
||||
Pending => Pending,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@@ -1,14 +1,24 @@
|
||||
use super::cached::reader::CacheReadProvider;
|
||||
use crate::tcprawclient::OpenBoxedBytesStreamsBox;
|
||||
use err::thiserror;
|
||||
use err::ThisError;
|
||||
use futures_util::Stream;
|
||||
use futures_util::TryStreamExt;
|
||||
use futures_util::StreamExt;
|
||||
use items_0::streamitem::RangeCompletableItem;
|
||||
use items_0::streamitem::Sitemty;
|
||||
use items_0::streamitem::StreamItem;
|
||||
use items_2::binsdim0::BinsDim0;
|
||||
use netpod::log::*;
|
||||
use netpod::range::evrange::NanoRange;
|
||||
use netpod::BinnedRange;
|
||||
use netpod::ChannelTypeConfigGen;
|
||||
use netpod::DtMs;
|
||||
use netpod::ReqCtx;
|
||||
use netpod::TsNano;
|
||||
use query::api4::events::EventsSubQuerySettings;
|
||||
use query::transform::TransformQuery;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
use std::task::Context;
|
||||
use std::task::Poll;
|
||||
|
||||
@@ -16,32 +26,201 @@ use std::task::Poll;
|
||||
#[cstm(name = "BinCachedGapFill")]
|
||||
pub enum Error {
|
||||
CacheReader(#[from] super::cached::reader::Error),
|
||||
GapFromFiner,
|
||||
}
|
||||
|
||||
type INP = Pin<Box<dyn Stream<Item = Result<BinsDim0<f32>, Error>> + Send>>;
|
||||
type INP = Pin<Box<dyn Stream<Item = Sitemty<BinsDim0<f32>>> + Send>>;
|
||||
|
||||
// Try to read from cache for the given bin len.
|
||||
// For gaps in the stream, construct an alternative input from finer bin len with a binner.
|
||||
pub struct GapFill {
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
series: u64,
|
||||
range: BinnedRange<TsNano>,
|
||||
do_time_weight: bool,
|
||||
bin_len_layers: Vec<DtMs>,
|
||||
inp: INP,
|
||||
inp_buf: Option<BinsDim0<f32>>,
|
||||
inp_finer: Option<INP>,
|
||||
last_bin_ts2: Option<TsNano>,
|
||||
exp_finer_range: NanoRange,
|
||||
cache_read_provider: Arc<dyn CacheReadProvider>,
|
||||
}
|
||||
|
||||
impl GapFill {
|
||||
// bin_len of the given range must be a cacheable bin_len.
|
||||
pub fn new(
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
|
||||
series: u64,
|
||||
range: BinnedRange<TsNano>,
|
||||
do_time_weight: bool,
|
||||
bin_len_layers: Vec<DtMs>,
|
||||
cache_read_provider: Box<dyn CacheReadProvider>,
|
||||
cache_read_provider: Arc<dyn CacheReadProvider>,
|
||||
) -> Result<Self, Error> {
|
||||
// super::fromlayers::TimeBinnedFromLayers::new(series, range, do_time_weight, bin_len_layers)?;
|
||||
let inp =
|
||||
super::cached::reader::CachedReader::new(series, range.bin_len.to_dt_ms(), range, cache_read_provider)?
|
||||
.map_err(Error::from);
|
||||
let ret = Self { inp: Box::pin(inp) };
|
||||
let inp = super::cached::reader::CachedReader::new(
|
||||
series,
|
||||
range.bin_len.to_dt_ms(),
|
||||
range.clone(),
|
||||
cache_read_provider.clone(),
|
||||
)?
|
||||
.map(|x| match x {
|
||||
Ok(x) => Ok(StreamItem::DataItem(RangeCompletableItem::Data(x))),
|
||||
Err(e) => Err(::err::Error::from_string(e)),
|
||||
});
|
||||
let ret = Self {
|
||||
ch_conf,
|
||||
transform_query,
|
||||
sub,
|
||||
log_level,
|
||||
ctx,
|
||||
open_bytes,
|
||||
series,
|
||||
range,
|
||||
do_time_weight,
|
||||
bin_len_layers,
|
||||
inp: Box::pin(inp),
|
||||
inp_buf: None,
|
||||
inp_finer: None,
|
||||
last_bin_ts2: None,
|
||||
// TODO just dummy:
|
||||
exp_finer_range: NanoRange { beg: 0, end: 0 },
|
||||
cache_read_provider,
|
||||
};
|
||||
Ok(ret)
|
||||
}
|
||||
|
||||
fn handle_bins_finer(mut self: Pin<&mut Self>, bins: BinsDim0<f32>) -> Result<BinsDim0<f32>, Error> {
|
||||
for (&ts1, &ts2) in bins.ts1s.iter().zip(&bins.ts2s) {
|
||||
if let Some(last) = self.last_bin_ts2 {
|
||||
if ts1 != last.ns() {
|
||||
return Err(Error::GapFromFiner);
|
||||
}
|
||||
}
|
||||
self.last_bin_ts2 = Some(TsNano::from_ns(ts2));
|
||||
}
|
||||
|
||||
// TODO keep bins from finer source.
|
||||
// Only write bins to cache if we receive another
|
||||
|
||||
// TODO make sure that input does not send "made-up" empty future bins.
|
||||
// On the other hand, if the request is over past range, but the channel was silent ever since?
|
||||
// Then we should in principle know that from is-alive status checking.
|
||||
// So, until then, allow made-up bins?
|
||||
// Maybe, for now, only write those bins before some last non-zero-count bin. The only safe way.
|
||||
|
||||
Ok(bins)
|
||||
}
|
||||
|
||||
fn handle_bins(mut self: Pin<&mut Self>, bins: BinsDim0<f32>) -> Result<BinsDim0<f32>, Error> {
|
||||
// TODO could use an interface to iterate over opaque bin items that only expose
|
||||
// edge and count information with all remaining values opaque.
|
||||
for (i, (&ts1, &ts2)) in bins.ts1s.iter().zip(&bins.ts2s).enumerate() {
|
||||
if let Some(last) = self.last_bin_ts2 {
|
||||
if ts1 != last.ns() {
|
||||
let mut ret = <BinsDim0<f32> as items_0::Empty>::empty();
|
||||
let mut bins = bins;
|
||||
bins.drain_into(&mut ret, 0..i);
|
||||
self.inp_buf = Some(bins);
|
||||
let range = NanoRange {
|
||||
beg: last.ns(),
|
||||
end: ts1,
|
||||
};
|
||||
self.setup_inp_finer(range)?;
|
||||
return Ok(ret);
|
||||
}
|
||||
}
|
||||
self.last_bin_ts2 = Some(TsNano::from_ns(ts2));
|
||||
}
|
||||
Ok(bins)
|
||||
}
|
||||
|
||||
fn setup_inp_finer(mut self: Pin<&mut Self>, range: NanoRange) -> Result<(), Error> {
|
||||
// Set up range to fill from finer.
|
||||
self.exp_finer_range = range.clone();
|
||||
if let Some(bin_len_finer) =
|
||||
super::grid::find_next_finer_bin_len(self.range.bin_len.to_dt_ms(), &self.bin_len_layers)
|
||||
{
|
||||
let range_finer = BinnedRange::from_nano_range(range, bin_len_finer);
|
||||
let inp_finer = GapFill::new(
|
||||
self.ch_conf.clone(),
|
||||
self.transform_query.clone(),
|
||||
self.sub.clone(),
|
||||
self.log_level.clone(),
|
||||
self.ctx.clone(),
|
||||
self.open_bytes.clone(),
|
||||
self.series,
|
||||
range_finer.clone(),
|
||||
self.do_time_weight,
|
||||
self.bin_len_layers.clone(),
|
||||
self.cache_read_provider.clone(),
|
||||
)?;
|
||||
let stream = Box::pin(inp_finer);
|
||||
let do_time_weight = self.do_time_weight;
|
||||
let range = BinnedRange::from_nano_range(range_finer.full_range(), self.range.bin_len.to_dt_ms());
|
||||
let stream =
|
||||
super::basic::TimeBinnedStream::new(stream, netpod::BinnedRangeEnum::Time(range), do_time_weight);
|
||||
self.inp_finer = Some(Box::pin(stream));
|
||||
} else {
|
||||
let do_time_weight = self.do_time_weight;
|
||||
let one_before_range = true;
|
||||
let range = BinnedRange::from_nano_range(range, self.range.bin_len.to_dt_ms());
|
||||
let stream = crate::timebinnedjson::TimeBinnableStream::new(
|
||||
range.full_range(),
|
||||
one_before_range,
|
||||
self.ch_conf.clone(),
|
||||
self.transform_query.clone(),
|
||||
self.sub.clone(),
|
||||
self.log_level.clone(),
|
||||
self.ctx.clone(),
|
||||
self.open_bytes.clone(),
|
||||
);
|
||||
// let stream: Pin<Box<dyn items_0::transform::TimeBinnableStreamTrait>> = stream;
|
||||
let stream = Box::pin(stream);
|
||||
// TODO rename TimeBinnedStream to make it more clear that it is the component which initiates the time binning.
|
||||
let stream =
|
||||
super::basic::TimeBinnedStream::new(stream, netpod::BinnedRangeEnum::Time(range), do_time_weight);
|
||||
let stream = stream.map(|item| match item {
|
||||
Ok(x) => match x {
|
||||
StreamItem::DataItem(x) => match x {
|
||||
RangeCompletableItem::Data(mut x) => {
|
||||
// TODO need a typed time binner
|
||||
if let Some(x) = x.as_any_mut().downcast_mut::<BinsDim0<f32>>() {
|
||||
let y = x.clone();
|
||||
Ok(StreamItem::DataItem(RangeCompletableItem::Data(y)))
|
||||
} else {
|
||||
Err(::err::Error::with_msg_no_trace(
|
||||
"GapFill expects incoming BinsDim0<f32>",
|
||||
))
|
||||
}
|
||||
}
|
||||
RangeCompletableItem::RangeComplete => {
|
||||
Ok(StreamItem::DataItem(RangeCompletableItem::RangeComplete))
|
||||
}
|
||||
},
|
||||
StreamItem::Log(x) => Ok(StreamItem::Log(x)),
|
||||
StreamItem::Stats(x) => Ok(StreamItem::Stats(x)),
|
||||
},
|
||||
Err(e) => Err(e),
|
||||
});
|
||||
// let stream: Pin<
|
||||
// Box<dyn Stream<Item = Sitemty<Box<dyn items_0::timebin::TimeBinned>>> + Send>,
|
||||
// > = Box::pin(stream);
|
||||
self.inp_finer = Some(Box::pin(stream));
|
||||
}
|
||||
Ok(())
|
||||
}
|
||||
}
|
||||
|
||||
impl Stream for GapFill {
|
||||
@@ -49,6 +228,101 @@ impl Stream for GapFill {
|
||||
|
||||
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context) -> Poll<Option<Self::Item>> {
|
||||
use Poll::*;
|
||||
loop {
|
||||
break if let Some(inp_finer) = self.inp_finer.as_mut() {
|
||||
// TODO
|
||||
// detect also gaps here: if gap from finer, then error.
|
||||
// on CacheUsage Use or Rereate:
|
||||
// write these bins to cache because we did not find them in cache before.
|
||||
match inp_finer.poll_next_unpin(cx) {
|
||||
Ready(Some(Ok(x))) => match x {
|
||||
StreamItem::DataItem(RangeCompletableItem::Data(x)) => {
|
||||
match self.as_mut().handle_bins_finer(x) {
|
||||
Ok(x) => Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::Data(x))))),
|
||||
Err(e) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
}
|
||||
}
|
||||
StreamItem::DataItem(RangeCompletableItem::RangeComplete) => {
|
||||
Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::RangeComplete))))
|
||||
}
|
||||
StreamItem::Log(x) => Ready(Some(Ok(StreamItem::Log(x)))),
|
||||
StreamItem::Stats(x) => Ready(Some(Ok(StreamItem::Stats(x)))),
|
||||
},
|
||||
Ready(Some(Err(e))) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
Ready(None) => {
|
||||
if let Some(j) = self.last_bin_ts2 {
|
||||
if j.ns() != self.exp_finer_range.end() {
|
||||
Ready(Some(Err(::err::Error::from_string(
|
||||
"finer input didn't deliver to the end",
|
||||
))))
|
||||
} else {
|
||||
self.last_bin_ts2 = None;
|
||||
self.exp_finer_range = NanoRange { beg: 0, end: 0 };
|
||||
self.inp_finer = None;
|
||||
continue;
|
||||
}
|
||||
} else {
|
||||
Ready(Some(Err(::err::Error::from_string("finer input delivered nothing"))))
|
||||
}
|
||||
}
|
||||
Pending => Pending,
|
||||
}
|
||||
} else if let Some(x) = self.inp_buf.take() {
|
||||
match self.as_mut().handle_bins_finer(x) {
|
||||
Ok(x) => Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::Data(x))))),
|
||||
Err(e) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
}
|
||||
} else {
|
||||
match self.inp.poll_next_unpin(cx) {
|
||||
Ready(Some(Ok(x))) => match x {
|
||||
StreamItem::DataItem(RangeCompletableItem::Data(x)) => match self.as_mut().handle_bins(x) {
|
||||
Ok(x) => Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::Data(x))))),
|
||||
Err(e) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
},
|
||||
StreamItem::DataItem(RangeCompletableItem::RangeComplete) => {
|
||||
Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::RangeComplete))))
|
||||
}
|
||||
StreamItem::Log(x) => Ready(Some(Ok(StreamItem::Log(x)))),
|
||||
StreamItem::Stats(x) => Ready(Some(Ok(StreamItem::Stats(x)))),
|
||||
},
|
||||
Ready(Some(Err(e))) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
Ready(None) => {
|
||||
// TODO assert that we have emitted up to the requested range.
|
||||
// If not, request the remaining range from "finer" input.
|
||||
if let Some(j) = self.last_bin_ts2 {
|
||||
if j.ns() != self.exp_finer_range.end() {
|
||||
let range = NanoRange {
|
||||
beg: j.ns(),
|
||||
end: self.range.full_range().end(),
|
||||
};
|
||||
match self.as_mut().setup_inp_finer(range) {
|
||||
Ok(()) => {
|
||||
continue;
|
||||
}
|
||||
Err(e) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
}
|
||||
} else {
|
||||
// self.last_bin_ts2 = None;
|
||||
// self.exp_finer_range = NanoRange { beg: 0, end: 0 };
|
||||
// self.inp_finer = None;
|
||||
// continue;
|
||||
Ready(None)
|
||||
}
|
||||
} else {
|
||||
warn!("----- NOTHING IN CACHE, SETUP FULL FROM FINER");
|
||||
let range = self.range.full_range();
|
||||
match self.as_mut().setup_inp_finer(range) {
|
||||
Ok(()) => {
|
||||
continue;
|
||||
}
|
||||
Err(e) => Ready(Some(Err(::err::Error::from_string(e)))),
|
||||
}
|
||||
}
|
||||
}
|
||||
Pending => Pending,
|
||||
}
|
||||
};
|
||||
}
|
||||
// When do we detect a gap:
|
||||
// - when the current item poses a gap to the last.
|
||||
// - when we see EOS before the requested range is filled.
|
||||
@@ -59,12 +333,12 @@ impl Stream for GapFill {
|
||||
// When a gap is detected:
|
||||
// - buffer the current item, if there is one (can also be EOS).
|
||||
// - create a new producer of bin:
|
||||
// - FromFiner(series, bin_len, range)
|
||||
// - GapFillwith finer range? FromFiner(series, bin_len, range) ?
|
||||
// - TimeBinnedFromLayers for a bin_len in layers would also go directly into GapFill.
|
||||
// what does FromFiner bring to the table?
|
||||
// It does not attempt to read the given bin-len from a cache, because we just did attempt that.
|
||||
// It still requires that bin-len is cacheable. (NO! it must work with the layering that I passed!)
|
||||
// Then it finds the next cacheable
|
||||
// Ready(None)
|
||||
todo!("poll the already created cached reader, detect and fill in gaps, send off to cache-write")
|
||||
}
|
||||
}
|
||||
|
||||
@@ -3,11 +3,14 @@ use crate::rangefilter2::RangeFilter2;
|
||||
use crate::tcprawclient::container_stream_from_bytes_stream;
|
||||
use crate::tcprawclient::make_sub_query;
|
||||
use crate::tcprawclient::OpenBoxedBytesStreamsBox;
|
||||
use crate::timebin::CacheReadProvider;
|
||||
use crate::timebin::TimeBinnedStream;
|
||||
use crate::transform::build_merged_event_transform;
|
||||
use crate::transform::EventsToTimeBinnable;
|
||||
use err::Error;
|
||||
use futures_util::future::BoxFuture;
|
||||
use futures_util::Future;
|
||||
use futures_util::FutureExt;
|
||||
use futures_util::Stream;
|
||||
use futures_util::StreamExt;
|
||||
use items_0::collect_s::Collectable;
|
||||
@@ -15,6 +18,7 @@ use items_0::on_sitemty_data;
|
||||
use items_0::streamitem::RangeCompletableItem;
|
||||
use items_0::streamitem::Sitemty;
|
||||
use items_0::streamitem::StreamItem;
|
||||
use items_0::timebin::TimeBinnable;
|
||||
use items_0::timebin::TimeBinned;
|
||||
use items_0::transform::TimeBinnableStreamBox;
|
||||
use items_0::transform::TimeBinnableStreamTrait;
|
||||
@@ -30,8 +34,13 @@ use netpod::ChannelTypeConfigGen;
|
||||
use netpod::DtMs;
|
||||
use netpod::ReqCtx;
|
||||
use query::api4::binned::BinnedQuery;
|
||||
use query::api4::events::EventsSubQuerySettings;
|
||||
use query::transform::TransformQuery;
|
||||
use serde_json::Value as JsonValue;
|
||||
use std::pin::Pin;
|
||||
use std::sync::Arc;
|
||||
use std::task::Context;
|
||||
use std::task::Poll;
|
||||
use std::time::Duration;
|
||||
use std::time::Instant;
|
||||
|
||||
@@ -40,28 +49,30 @@ fn assert_stream_send<'u, R>(stream: impl 'u + Send + Stream<Item = R>) -> impl
|
||||
stream
|
||||
}
|
||||
|
||||
async fn timebinnable_stream(
|
||||
query: BinnedQuery,
|
||||
// TODO factor out, it is use now also from GapFill.
|
||||
pub async fn timebinnable_stream(
|
||||
range: NanoRange,
|
||||
one_before_range: bool,
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
ctx: &ReqCtx,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
) -> Result<TimeBinnableStreamBox, Error> {
|
||||
let subq = make_sub_query(
|
||||
ch_conf,
|
||||
range.clone().into(),
|
||||
one_before_range,
|
||||
query.transform().clone(),
|
||||
query.test_do_wasm(),
|
||||
&query,
|
||||
query.log_level().into(),
|
||||
ctx,
|
||||
transform_query,
|
||||
sub.clone(),
|
||||
log_level.clone(),
|
||||
&ctx,
|
||||
);
|
||||
let inmem_bufcap = subq.inmem_bufcap();
|
||||
let _wasm1 = subq.wasm1().map(ToString::to_string);
|
||||
let mut tr = build_merged_event_transform(subq.transform())?;
|
||||
let bytes_streams = open_bytes.open(subq, ctx.clone()).await?;
|
||||
let bytes_streams = open_bytes.open(subq, ctx.as_ref().clone()).await?;
|
||||
let mut inps = Vec::new();
|
||||
for s in bytes_streams {
|
||||
let s = container_stream_from_bytes_stream::<ChannelEvents>(s, inmem_bufcap.clone(), "TODOdbgdesc".into())?;
|
||||
@@ -70,7 +81,7 @@ async fn timebinnable_stream(
|
||||
}
|
||||
// TODO propagate also the max-buf-len for the first stage event reader.
|
||||
// TODO use a mixture of count and byte-size as threshold.
|
||||
let stream = Merger::new(inps, query.merger_out_len_max());
|
||||
let stream = Merger::new(inps, sub.merger_out_len_max());
|
||||
|
||||
let stream = RangeFilter2::new(stream, range, one_before_range);
|
||||
|
||||
@@ -221,16 +232,88 @@ async fn timebinnable_stream(
|
||||
Ok(TimeBinnableStreamBox(stream))
|
||||
}
|
||||
|
||||
pub struct TimeBinnableStream {
|
||||
make_stream_fut: Option<Pin<Box<dyn Future<Output = Result<TimeBinnableStreamBox, Error>> + Send>>>,
|
||||
stream: Option<Pin<Box<dyn Stream<Item = Sitemty<Box<dyn TimeBinnable>>> + Send>>>,
|
||||
}
|
||||
|
||||
impl TimeBinnableStream {
|
||||
pub fn new(
|
||||
range: NanoRange,
|
||||
one_before_range: bool,
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
transform_query: TransformQuery,
|
||||
sub: EventsSubQuerySettings,
|
||||
log_level: String,
|
||||
// TODO take by Arc ref
|
||||
ctx: Arc<ReqCtx>,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
) -> Self {
|
||||
let fut = timebinnable_stream(
|
||||
range,
|
||||
one_before_range,
|
||||
ch_conf,
|
||||
transform_query,
|
||||
sub,
|
||||
log_level,
|
||||
ctx,
|
||||
open_bytes,
|
||||
);
|
||||
let fut = Box::pin(fut);
|
||||
Self {
|
||||
make_stream_fut: Some(fut),
|
||||
stream: None,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// impl WithTransformProperties + Send
|
||||
|
||||
impl Stream for TimeBinnableStream {
|
||||
type Item = Sitemty<Box<dyn TimeBinnable>>;
|
||||
|
||||
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context) -> Poll<Option<Self::Item>> {
|
||||
use Poll::*;
|
||||
loop {
|
||||
break if let Some(fut) = self.make_stream_fut.as_mut() {
|
||||
match fut.poll_unpin(cx) {
|
||||
Ready(x) => match x {
|
||||
Ok(x) => {
|
||||
self.make_stream_fut = None;
|
||||
self.stream = Some(Box::pin(x));
|
||||
continue;
|
||||
}
|
||||
Err(e) => Ready(Some(Err(e))),
|
||||
},
|
||||
Pending => Pending,
|
||||
}
|
||||
} else if let Some(fut) = self.stream.as_mut() {
|
||||
match fut.poll_next_unpin(cx) {
|
||||
Ready(Some(x)) => Ready(Some(x)),
|
||||
Ready(None) => {
|
||||
self.stream = None;
|
||||
Ready(None)
|
||||
}
|
||||
Pending => Pending,
|
||||
}
|
||||
} else {
|
||||
Ready(None)
|
||||
};
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
async fn timebinned_stream(
|
||||
query: BinnedQuery,
|
||||
binned_range: BinnedRangeEnum,
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
ctx: &ReqCtx,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
cache_read_provider: Option<Arc<dyn CacheReadProvider>>,
|
||||
) -> Result<Pin<Box<dyn Stream<Item = Sitemty<Box<dyn TimeBinned>>> + Send>>, Error> {
|
||||
use netpod::query::CacheUsage;
|
||||
match query.cache_usage() {
|
||||
CacheUsage::Use | CacheUsage::Recreate => {
|
||||
match (query.cache_usage(), cache_read_provider) {
|
||||
(CacheUsage::Use | CacheUsage::Recreate, Some(cache_read_provider)) => {
|
||||
let series = if let Some(x) = query.channel().series() {
|
||||
x
|
||||
} else {
|
||||
@@ -256,8 +339,13 @@ async fn timebinned_stream(
|
||||
// DtMs::from_ms_u64(1000 * 10),
|
||||
]
|
||||
};
|
||||
let cache_read_provider = err::todoval();
|
||||
let stream = crate::timebin::TimeBinnedFromLayers::new(
|
||||
ch_conf,
|
||||
query.transform().clone(),
|
||||
EventsSubQuerySettings::from(&query),
|
||||
query.log_level().into(),
|
||||
Arc::new(ctx.clone()),
|
||||
open_bytes.clone(),
|
||||
series,
|
||||
binned_range.binned_range_time(),
|
||||
do_time_weight,
|
||||
@@ -273,13 +361,23 @@ async fn timebinned_stream(
|
||||
let stream: Pin<Box<dyn Stream<Item = Sitemty<Box<dyn TimeBinned>>> + Send>> = Box::pin(stream);
|
||||
Ok(stream)
|
||||
}
|
||||
CacheUsage::Ignore => {
|
||||
_ => {
|
||||
let range = binned_range.binned_range_time().to_nano_range();
|
||||
|
||||
let do_time_weight = true;
|
||||
let one_before_range = true;
|
||||
|
||||
let stream = timebinnable_stream(query.clone(), range, one_before_range, ch_conf, ctx, open_bytes).await?;
|
||||
let stream = timebinnable_stream(
|
||||
range,
|
||||
one_before_range,
|
||||
ch_conf,
|
||||
query.transform().clone(),
|
||||
(&query).into(),
|
||||
query.log_level().into(),
|
||||
Arc::new(ctx.clone()),
|
||||
open_bytes,
|
||||
)
|
||||
.await?;
|
||||
let stream: Pin<Box<dyn TimeBinnableStreamTrait>> = stream.0;
|
||||
let stream = Box::pin(stream);
|
||||
// TODO rename TimeBinnedStream to make it more clear that it is the component which initiates the time binning.
|
||||
@@ -309,13 +407,22 @@ pub async fn timebinned_json(
|
||||
ch_conf: ChannelTypeConfigGen,
|
||||
ctx: &ReqCtx,
|
||||
open_bytes: OpenBoxedBytesStreamsBox,
|
||||
cache_read_provider: Option<Arc<dyn CacheReadProvider>>,
|
||||
) -> Result<JsonValue, Error> {
|
||||
let deadline = Instant::now() + query.timeout_content().unwrap_or(Duration::from_millis(5000));
|
||||
let binned_range = BinnedRangeEnum::covering_range(query.range().clone(), query.bin_count())?;
|
||||
// TODO derive better values, from query
|
||||
let collect_max = 10000;
|
||||
let bytes_max = 100 * collect_max;
|
||||
let stream = timebinned_stream(query.clone(), binned_range.clone(), ch_conf, ctx, open_bytes).await?;
|
||||
let stream = timebinned_stream(
|
||||
query.clone(),
|
||||
binned_range.clone(),
|
||||
ch_conf,
|
||||
ctx,
|
||||
open_bytes,
|
||||
cache_read_provider,
|
||||
)
|
||||
.await?;
|
||||
let stream = timebinned_to_collectable(stream);
|
||||
let collected = Collect::new(stream, deadline, collect_max, bytes_max, None, Some(binned_range));
|
||||
let collected: BoxFuture<_> = Box::pin(collected);
|
||||
|
||||
Reference in New Issue
Block a user