use crate::agg::binnedt::TBinnerStream; use crate::binned::binnedfrompbv::FetchedPreBinned; use crate::binned::query::{CacheUsage, PreBinnedQuery}; use crate::binned::WithLen; use crate::cache::{write_pb_cache_min_max_avg_scalar, CacheFileDesc, WrittenPbCache}; use crate::decode::{Endianness, EventValueFromBytes, EventValueShape, NumFromBytes}; use crate::merge::mergedfromremotes::MergedFromRemotes; use crate::streamlog::Streamlog; use err::Error; use futures_core::Stream; use futures_util::{FutureExt, StreamExt}; use items::numops::NumOps; use items::{ Appendable, EventsNodeProcessor, FrameType, PushableIndex, RangeCompletableItem, ReadableFromFile, Sitemty, StreamItem, TimeBinnableType, }; use netpod::log::*; use netpod::query::RawEventsQuery; use netpod::{ x_bin_count, AggKind, BinnedRange, NodeConfigCached, PerfOpts, PreBinnedPatchIterator, PreBinnedPatchRange, Shape, }; use serde::de::DeserializeOwned; use serde::Serialize; use std::future::Future; use std::io; use std::marker::PhantomData; use std::path::PathBuf; use std::pin::Pin; use std::task::{Context, Poll}; use tokio::fs::{File, OpenOptions}; pub struct PreBinnedValueStream where NTY: NumOps + NumFromBytes + Serialize + 'static, END: Endianness + 'static, EVS: EventValueShape + EventValueFromBytes + 'static, ENP: EventsNodeProcessor>::Batch>, { query: PreBinnedQuery, shape: Shape, agg_kind: AggKind, node_config: NodeConfigCached, open_check_local_file: Option> + Send>>>, fut2: Option< Pin::Output as TimeBinnableType>::Output>> + Send>>, >, read_from_cache: bool, cache_written: bool, data_complete: bool, range_complete_observed: bool, range_complete_emitted: bool, errored: bool, completed: bool, streamlog: Streamlog, values: <::Output as TimeBinnableType>::Output, write_fut: Option> + Send>>>, read_cache_fut: Option< Pin< Box< dyn Future::Output as TimeBinnableType>::Output>> + Send, >, >, >, _m1: PhantomData, _m2: PhantomData, _m3: PhantomData, _m4: PhantomData, } impl PreBinnedValueStream where NTY: NumOps + NumFromBytes + Serialize + 'static, END: Endianness + 'static, EVS: EventValueShape + EventValueFromBytes + 'static, ENP: EventsNodeProcessor>::Batch> + 'static, ::Output: PushableIndex + Appendable, // TODO is this needed: Sitemty<::Output>: FrameType, // TODO who exactly needs this DeserializeOwned? Sitemty<<::Output as TimeBinnableType>::Output>: FrameType + DeserializeOwned, { pub fn new(query: PreBinnedQuery, shape: Shape, agg_kind: AggKind, node_config: &NodeConfigCached) -> Self { Self { query, shape, agg_kind, node_config: node_config.clone(), open_check_local_file: None, fut2: None, read_from_cache: false, cache_written: false, data_complete: false, range_complete_observed: false, range_complete_emitted: false, errored: false, completed: false, streamlog: Streamlog::new(node_config.ix as u32), // TODO use alias via some trait associated type: values: <<::Output as TimeBinnableType>::Output as Appendable>::empty(), write_fut: None, read_cache_fut: None, _m1: PhantomData, _m2: PhantomData, _m3: PhantomData, _m4: PhantomData, } } fn setup_merged_from_remotes( &mut self, ) -> Result< Pin::Output as TimeBinnableType>::Output>> + Send>>, Error, > { let evq = RawEventsQuery { channel: self.query.channel().clone(), range: self.query.patch().patch_range(), agg_kind: self.query.agg_kind().clone(), disk_io_buffer_size: self.query.disk_io_buffer_size(), }; if self.query.patch().patch_t_len() % self.query.patch().bin_t_len() != 0 { let msg = format!( "Patch length inconsistency {} {}", self.query.patch().patch_t_len(), self.query.patch().bin_t_len() ); error!("{}", msg); return Err(Error::with_msg(msg)); } // TODO do I need to set up more transformations or binning to deliver the requested data? let count = self.query.patch().patch_t_len() / self.query.patch().bin_t_len(); let range = BinnedRange::covering_range(evq.range.clone(), count as u32)? .ok_or(Error::with_msg("covering_range returns None"))?; let perf_opts = PerfOpts { inmem_bufcap: 512 }; let s = MergedFromRemotes::::new(evq, perf_opts, self.node_config.node_config.cluster.clone()); let ret = TBinnerStream::<_, ::Output>::new( s, range, x_bin_count(&self.shape, &self.agg_kind), ); Ok(Box::pin(ret)) } fn setup_from_higher_res_prebinned( &mut self, range: PreBinnedPatchRange, ) -> Result< Pin::Output as TimeBinnableType>::Output>> + Send>>, Error, > { let g = self.query.patch().bin_t_len(); let h = range.grid_spec.bin_t_len(); trace!( "try_setup_fetch_prebinned_higher_res found g {} h {} ratio {} mod {} {:?}", g, h, g / h, g % h, range, ); if g / h <= 1 { let msg = format!("try_setup_fetch_prebinned_higher_res g {} h {}", g, h); return Err(Error::with_msg(msg)); } if g / h > 1024 * 10 { let msg = format!("try_setup_fetch_prebinned_higher_res g {} h {}", g, h); return Err(Error::with_msg(msg)); } if g % h != 0 { let msg = format!("try_setup_fetch_prebinned_higher_res g {} h {}", g, h); return Err(Error::with_msg(msg)); } let node_config = self.node_config.clone(); let patch_it = PreBinnedPatchIterator::from_range(range); let s = futures_util::stream::iter(patch_it) .map({ let q2 = self.query.clone(); let disk_io_buffer_size = self.query.disk_io_buffer_size(); let disk_stats_every = self.query.disk_stats_every().clone(); let report_error = self.query.report_error(); move |patch| { let query = PreBinnedQuery::new( patch, q2.channel().clone(), q2.agg_kind().clone(), q2.cache_usage().clone(), disk_io_buffer_size, disk_stats_every.clone(), report_error, ); let ret = FetchedPreBinned::<<::Output as TimeBinnableType>::Output>::new( &query, &node_config, )?; Ok(ret) } }) .map(|k| { let s: Pin + Send>> = match k { Ok(k) => Box::pin(k), Err(e) => Box::pin(futures_util::stream::iter(vec![Err(e)])), }; s }) .flatten(); Ok(Box::pin(s)) } fn try_setup_fetch_prebinned_higher_res(&mut self) -> Result<(), Error> { let range = self.query.patch().patch_range(); match PreBinnedPatchRange::covering_range(range, self.query.patch().bin_count() + 1) { Ok(Some(range)) => { self.fut2 = Some(self.setup_from_higher_res_prebinned(range)?); } Ok(None) => { self.fut2 = Some(self.setup_merged_from_remotes()?); } Err(e) => return Err(e), } Ok(()) } } impl Stream for PreBinnedValueStream where NTY: NumOps + NumFromBytes + Serialize + Unpin + 'static, END: Endianness + Unpin + 'static, EVS: EventValueShape + EventValueFromBytes + Unpin + 'static, ENP: EventsNodeProcessor>::Batch> + Unpin + 'static, ::Output: PushableIndex + Appendable, // TODO needed? Sitemty<::Output>: FrameType, Sitemty<<::Output as TimeBinnableType>::Output>: FrameType + DeserializeOwned, { type Item = Sitemty<<::Output as TimeBinnableType>::Output>; fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context) -> Poll> { use Poll::*; 'outer: loop { break if self.completed { panic!("PreBinnedValueStream poll_next on completed"); } else if self.errored { self.completed = true; Ready(None) } else if let Some(item) = self.streamlog.pop() { Ready(Some(Ok(StreamItem::Log(item)))) } else if let Some(fut) = &mut self.write_fut { match fut.poll_unpin(cx) { Ready(item) => { self.cache_written = true; self.write_fut = None; match item { Ok(res) => { self.streamlog.append( Level::INFO, format!( "cache file written bytes: {} duration {} ms", res.bytes, res.duration.as_millis() ), ); continue 'outer; } Err(e) => { self.errored = true; Ready(Some(Err(e))) } } } Pending => Pending, } } else if let Some(fut) = &mut self.read_cache_fut { match fut.poll_unpin(cx) { Ready(item) => { self.read_cache_fut = None; match item { Ok(item) => { self.data_complete = true; self.range_complete_observed = true; Ready(Some(Ok(item))) } Err(e) => { self.errored = true; Ready(Some(Err(e))) } } } Pending => Pending, } } else if self.range_complete_emitted { self.completed = true; Ready(None) } else if self.data_complete { if self.cache_written { if self.range_complete_observed { self.range_complete_emitted = true; let item = RangeCompletableItem::RangeComplete; Ready(Some(Ok(StreamItem::DataItem(item)))) } else { self.completed = true; Ready(None) } } else if self.read_from_cache { self.cache_written = true; continue 'outer; } else { match self.query.cache_usage() { CacheUsage::Use | CacheUsage::Recreate => { let msg = format!( "write cache file query: {:?} bin count: {}", self.query.patch(), self.values.len(), ); self.streamlog.append(Level::INFO, msg); // TODO use alias vias trait: let emp = <<::Output as TimeBinnableType>::Output as Appendable>::empty(); let values = std::mem::replace(&mut self.values, emp); let fut = write_pb_cache_min_max_avg_scalar( values, self.query.patch().clone(), self.query.agg_kind().clone(), self.query.channel().clone(), self.node_config.clone(), ); self.write_fut = Some(Box::pin(fut)); continue 'outer; } _ => { self.cache_written = true; continue 'outer; } } } } else if let Some(fut) = self.fut2.as_mut() { match fut.poll_next_unpin(cx) { Ready(Some(k)) => match k { Ok(item) => match item { StreamItem::Log(item) => Ready(Some(Ok(StreamItem::Log(item)))), StreamItem::Stats(item) => Ready(Some(Ok(StreamItem::Stats(item)))), StreamItem::DataItem(item) => match item { RangeCompletableItem::RangeComplete => { self.range_complete_observed = true; continue 'outer; } RangeCompletableItem::Data(item) => { self.values.append(&item); Ready(Some(Ok(StreamItem::DataItem(RangeCompletableItem::Data(item))))) } }, }, Err(e) => { self.errored = true; Ready(Some(Err(e))) } }, Ready(None) => { self.data_complete = true; continue 'outer; } Pending => Pending, } } else if let Some(fut) = self.open_check_local_file.as_mut() { match fut.poll_unpin(cx) { Ready(item) => { self.open_check_local_file = None; match item { Ok(file) => { self.read_from_cache = true; let fut = <<::Output as TimeBinnableType>::Output as ReadableFromFile>::read_from_file(file)?; self.read_cache_fut = Some(Box::pin(fut)); continue 'outer; } Err(e) => match e.kind() { // TODO other error kinds io::ErrorKind::NotFound => match self.try_setup_fetch_prebinned_higher_res() { Ok(_) => { if self.fut2.is_none() { let e = Err(Error::with_msg(format!( "try_setup_fetch_prebinned_higher_res failed" ))); self.errored = true; Ready(Some(e)) } else { continue 'outer; } } Err(e) => { let e = Error::with_msg(format!( "try_setup_fetch_prebinned_higher_res error: {:?}", e )); self.errored = true; Ready(Some(Err(e))) } }, _ => { error!("File I/O error: kind {:?} {:?}\n\n..............", e.kind(), e); self.errored = true; Ready(Some(Err(e.into()))) } }, } } Pending => Pending, } } else { let cfd = CacheFileDesc::new( self.query.channel().clone(), self.query.patch().clone(), self.query.agg_kind().clone(), ); let path = match self.query.cache_usage() { CacheUsage::Use => cfd.path(&self.node_config), _ => PathBuf::from("DOESNOTEXIST"), }; let fut = async { OpenOptions::new().read(true).open(path).await }; self.open_check_local_file = Some(Box::pin(fut)); continue 'outer; }; } } }