src/main/scala/io/sqooba/oss/timeseries/TimeSeries.scala

package io.sqooba.oss.timeseries

import java.util.concurrent.TimeUnit

import io.sqooba.oss.timeseries.bucketing.TimeBucketer
import io.sqooba.oss.timeseries.immutable._
import io.sqooba.oss.timeseries.window.{TimeAwareReversibleAggregator, TimeUnawareReversibleAggregator, WindowSlider}

import scala.concurrent.duration.TimeUnit
import scala.reflect.runtime.universe._

trait TimeSeries[+T] {

  /** The value valid at time 't' if there is one. */
  def at(t: Long): Option[T]

  /** The whole entry containing the value valid at time 't', if there is one */
  def entryAt(t: Long): Option[TSEntry[T]]

  /** Split this time series into two.
   *
   * Returns a tuple of two contiguous time series,
   * such that the left time series is never defined for t >= 'at'
   * and the right time series is never defined for t < 'at'.
   *
   * Default implementation simply returns (this.trimRight(at), this.trimLeft(at))
   */
  def split(at: Long): (TimeSeries[T], TimeSeries[T]) = (this.trimRight(at), this.trimLeft(at))

  /**
   * Split this time series into two.
   *
   * If 'at' is within the domain of a particular entry, the time series will be split either
   * at the beginning or end of that entry, according to the passed 'splitAfterEntry'
   */
  def splitDiscrete(at: Long, splitAfterEntry: Boolean = true): (TimeSeries[T], TimeSeries[T]) =
    (this.trimRightDiscrete(at, splitAfterEntry), this.trimLeftDiscrete(at, !splitAfterEntry))

  /** Extract a slice from this time series.
   *
   * The returned slice will only be defined between the specified bounds such that:
   *
   *  this.at(x) == returned.at(x) for all x in [from, to[.
   *
   * If x is outside of the bounds, returned.at(x) is None.
   */
  def slice(from: Long, to: Long): TimeSeries[T] = this.trimLeft(from).trimRight(to)

  /**
   * Extract a slice from this time series, while preventing entries on the slice boundaries
   * from being split.
   */
  def sliceDiscrete(from: Long, to: Long, fromInclusive: Boolean = true, toInclusive: Boolean = true): TimeSeries[T] =
    this.trimLeftDiscrete(from, fromInclusive).trimRightDiscrete(to, toInclusive)

  /** Returns a time series that is never defined for t >= at and unchanged for t < at */
  def trimRight(at: Long): TimeSeries[T]

  /** Similar to trimRight, but if `at` lands within an existing entry,
   * the returned time series' domain is either, depending on 'includeEntry':
   *  - extended to that entry's end of validity, which fully remains in the time series (the default)
   *  - trimmed further to the previous entry's end of validity, fully removing the entry from the time series
   */
  def trimRightDiscrete(at: Long, includeEntry: Boolean = true): TimeSeries[T]

  /** Returns a time series that is never defined for t < at and unchanged for t >= at */
  def trimLeft(at: Long): TimeSeries[T]

  /** Similar to trimLeft, but if `at` lands within an existing entry,
   * the returned time series' domain is either, depending on 'includeEntry':
   *  - extended to that entry's timestamp, which fully remains in the time series (the default)
   *  - trimmed further to the next entry's timestamp, fully removing the entry from the time series
   */
  def trimLeftDiscrete(at: Long, includeEntry: Boolean = true): TimeSeries[T]

  /** The number of elements in this time series. */
  def size: Int

  /** Convenient and efficient method for `size == 0` */
  def isEmpty: Boolean

  /** Convenient method for !isEmpty */
  def nonEmpty: Boolean = !isEmpty

  /** True if this time series is defined at 'at'. Ie, at('at') would return Some[T] */
  def defined(t: Long): Boolean = at(t).isDefined

  /** Returns true if it is guaranteed that this timeseries was compressed at construction.
   * If this returns false it is not known whether the series has been compressed.
   */
  def isCompressed: Boolean

  /** Map the values within the time series.
   *
   * @param compress controls whether or not compression should occur on the output series.
   *                 If set to false, timestamps and validities remain unchanged. Defaults to true.
   */
  def map[O: WeakTypeTag](f: T => O, compress: Boolean = true): TimeSeries[O] =
    mapEntries[O](e => f(e.value), compress)

  /** Map the values within the time series. If not compressing, the timestamps and
   * validities of entries remain unchanged, but the time is made available for
   * cases where the new value would depend on it.
   *
   * @param compress controls whether or not compression should occur on the output series.
   *                 Defaults to true.
   */
  @deprecated("Deprecated in favor of 'mapEntries'.")
  def mapWithTime[O: WeakTypeTag](f: (Long, T) => O, compress: Boolean = true): TimeSeries[O] =
    mapEntries[O](e => f(e.timestamp, e.value), compress)

  /** Map the values within the time series. If not compressing, the timestamps and
   * validities of entries remain unchanged, but they are made available for cases
   * where the new value would depend on them.
   *
   * @param compress controls whether or not compression should occur on the output series.
   *                 Defaults to true.
   */
  def mapEntries[O: WeakTypeTag](f: TSEntry[T] => O, compress: Boolean = true): TimeSeries[O]

  /** Map the values within the time series to an option. Results of the form 'Some(v)'
   * will be kept as entries with 'v'. 'None' results will be discarded.
   *
   * @param compress controls whether or not compression should occur on the output series.
   *                 If set to false, timestamps and validities remain unchanged. Defaults to true.
   */
  def filterMap[O](f: T => Option[O], compress: Boolean = true): TimeSeries[O] =
    filterMapEntries(entry => f(entry.value), compress)

  /** Map the entries within this series to options. Results of the form 'Some(v)' will
   * be kept as entries with 'v'. 'None' results will be discarded.
   *
   * @note The default implemenation is not optimised, consider overriding it for
   *       better performance, for example see
   *       [[io.sqooba.oss.timeseries.immutable.VectorTimeSeries.filterMapEntries* here]].
   *
   * @param compress controls whether or not compression should occur on the output series.
   *                 If set to false, timestamps and validities remain unchanged. Defaults to true.
   */
  def filterMapEntries[O](f: TSEntry[T] => Option[O], compress: Boolean = true): TimeSeries[O] =
    mapEntries(f, compress).filter(_.isDefined).map(_.get, compress)

  /** Return a time series that will only contain entries for which the passed predicate
   * returned True.
   */
  def filterEntries(predicate: TSEntry[T] => Boolean): TimeSeries[T]

  /** Return a time series that will only contain entries containing values for which
   * the passed predicate returned True.
   */
  def filter(predicate: T => Boolean): TimeSeries[T] =
    filterEntries(tse => predicate(tse.value))

  /** Fill the wholes in the definition domain of this time series with the passed value.
   * The resulting time series will have a single continuous definition domain,
   * provided the original time series was non-empty.
   */
  def fill[U >: T](whenUndef: U): TimeSeries[U] = {
    val (start, end) = (this.head.timestamp, this.last.definedUntil)
    this.fallback(TSEntry(start, whenUndef, end - start))
  }

  /** Return a Seq of the TSEntries representing this time series. */
  def entries: Seq[TSEntry[T]]

  /** Return a Seq of the values contained by this series, in their chronological order. */
  def values: Seq[T] = entries.map(_.value)

  /** Return the first (chronological) entry in this time series.
   *
   * @throws NoSuchElementException if this time series is empty.
   */
  def head: TSEntry[T] = headOption.get

  /** Return a filled option containing the first (chronological) entry in this
   * time series.
   * None if this time series is empty.
   */
  def headOption: Option[TSEntry[T]]

  /** Return the first (chronological) value in this time series.
   *
   * @throws NoSuchElementException if this time series is empty.
   */
  def headValue: T = head.value

  /** Return a filled option containing the first (chronological) value in this
   * time series.
   * None if this time series is empty.
   */
  def headValueOption: Option[T] = headOption.map(_.value)

  /** Return the last (chronological) entry in this time series.
   *
   * @throws NoSuchElementException if this time series is empty.
   */
  def last: TSEntry[T] = lastOption.get

  /** Return a filled option containing the last (chronological) entry in this
   * time series.
   * None if this time series is empty.
   */
  def lastOption: Option[TSEntry[T]]

  /** Return the last (chronological) value in this time series.
   *
   * @throws NoSuchElementException if this time series is empty.
   */
  def lastValue: T = last.value

  /** Return a filled option containing the last (chronological) value in this time series.
   * None if this time series is empty.
   */
  def lastValueOption: Option[T] = lastOption.map(_.value)

  /** Append the 'other' time series to this one at exactly the first of other's entries timestamp.
   *
   * if t_app = other.head.timestamp, this time series domain will be completely forgotten for all
   * t > t_app, and replaced with whatever is in the domain of 'other'.
   *
   * This is equivalent to right-trimming this time series at other.head.timestamp and prepending
   * it as-is to 'other'.
   *
   * If 'other' is empty, this time series is unchanged.
   */
  def append[U >: T](other: TimeSeries[U], compress: Boolean = true): TimeSeries[U] =
    other.headOption
      .map(head => this.trimRight(head.timestamp).entries ++ other.entries)
      .map(_.foldLeft(newBuilder[U](compress))(_ += _).result())
      .getOrElse(this)

  /** Prepend the 'other' time series to this one at exactly the last of other's entries definedUntil().
   *
   * if t_prep = other.last.definedUntil, this time series domain will be completely forgotten for all
   * t <= t_prep, and replaced with whatever is in the domain of 'other'.
   *
   * This is equivalent to left-trimming this time series at other.last.definedUntil and appending
   * it as-is with to 'other'.
   *
   * If 'other' is empty, this time series is unchanged.
   */
  def prepend[U >: T](other: TimeSeries[U], compress: Boolean = true): TimeSeries[U] =
    other.lastOption
      .map(last => other.entries ++ this.trimLeft(last.definedUntil).entries)
      .map(_.foldLeft(newBuilder[U](compress))(_ += _).result())
      .getOrElse(this)

  /**
   * Merge another time series to this one, using the provided operator
   * to merge entries.
   *
   * The operator can define all four cases encountered during merging:
   *   - both entries defined
   *   - only one of the entries defined
   *   - no entry defined
   *
   * In any case, the returned time series will only be defined between the
   * bounds defined by min(this.head.timestamp, other.head.timestamp) and
   * max(this.last.definedUntil, other.last.definedUntil).
   */
  def merge[O, R](op: (Option[T], Option[O]) => Option[R])(other: TimeSeries[O]): TimeSeries[R] =
    TimeSeriesMerger
      .mergeEntries(this.entries, other.entries, compress = false)(op)
      .foldLeft(this.newBuilder[R]())(_ += _)
      .result()

  /**
   * Merge another time series to this one, using the provided operator
   * to merge entries. The resulting series has the value defined by the operator
   * at all times where both input series are defined. At all other times (i.e. where only one
   * or none of the input series is defined), the resulting series is not defined.
   *
   * @param op    the operator for the merge
   * @param other TimeSeries to merge
   * @return the strictly merged TimeSeries
   */
  def strictMerge[O, R](op: (T, O) => R)(other: TimeSeries[O]): TimeSeries[R] =
    this.merge[O, R] {
      case (Some(t), Some(o)) => Some(op(t, o))
      case _                  => None
    }(other)

  /**
   * Sum the entries within this and the provided time series such that
   *
   * - If strict (default): this.at(x) + other.at(x) = returned.at(x) where x may take any value where
   * both time series are defined.
   * - If non strict : this.at(x) + other.at(x) = returned.at(x) where x may take any value where
   * any time series is defined.
   */
  def plus[U >: T](other: TimeSeries[U], strict: Boolean = true)(implicit n: Numeric[U]): TimeSeries[U] = {
    import n._

    if (strict) {
      strictMerge[U, U](_ + _)(other)
    } else {
      merge[U, U](NumericTimeSeries.nonStrictPlus(_, _)(n))(other)
    }
  }

  def +[U >: T](other: TimeSeries[U])(implicit n: Numeric[U]): TimeSeries[U] = plus(other)(n)

  /**
   * Subtract the entries within this and the provided time series such that
   * this.at(x) - other.at(x) = returned.at(x) where x may take any value where
   * both time series are defined.
   */
  def minus[U >: T](
    other: TimeSeries[U],
    leftHandDefault: Option[U] = None,
    rightHandDefault: Option[U] = None
  )(implicit n: Numeric[U]): TimeSeries[U] =
    merge[U, U](NumericTimeSeries.nonStrictMinus(leftHandDefault, rightHandDefault)(_, _)(n))(other)

  def -[U >: T](other: TimeSeries[U])(implicit n: Numeric[U]): TimeSeries[U] = minus(other)

  /**
   * Multiply the entries within this and the provided time series such that
   * this.at(x) * other.at(x) = returned.at(x) where x may take any value where
   * both time series are defined.
   */
  def multiply[U >: T](other: TimeSeries[U])(implicit n: Numeric[U]): TimeSeries[U] = {
    import n._

    strictMerge[U, U](_ * _)(other)
  }

  def *[U >: T](other: TimeSeries[U])(implicit n: Numeric[U]): TimeSeries[U] = multiply(other)

  /**
   * Zips this time series with another one, returning a time series
   * of tuples containing the values from both this and the other time
   * series across their common domain.
   */
  def strictZip[O](other: TimeSeries[O]): TimeSeries[(T, O)] = strictMerge[O, (T, O)]((_, _))(other)

  /**
   * Computes the integral of this time series.
   * This function returns a step function, so only represents an approximation.
   * Use it if you need to compute multiple integrals of the same time series.
   */
  def stepIntegral[U >: T](stepLengthMs: Long, timeUnit: TimeUnit = TimeUnit.MILLISECONDS)(implicit n: Numeric[U]): TimeSeries[Double] = {
    TimeSeries.ofOrderedEntriesUnsafe(
      NumericTimeSeries.stepIntegral[U](
        this.splitEntriesLongerThan(stepLengthMs).entries,
        timeUnit
      )
    )
  }

  @deprecated("This function does only sum values in a slice of the series. Use slice and stepIntegral or slidingIntegral.")
  def integrateBetween[U >: T](from: Long, to: Long)(implicit n: Numeric[U]): U =
    this.slice(from, to).entries.map(_.value).sum(n)

  /**
   * Splits up all entries of this timeseries that are longer than the given maximal length.
   * This is slightly similar but not strictly equivalent to resampling a series:
   * if you need some form of resampling, make sure this is what you need.
   *
   * @param entryMaxLength to use for splitting
   * @return timeseries with entries guaranteed to be shorter than the given
   *         maximal length
   */
  def splitEntriesLongerThan(entryMaxLength: Long): TimeSeries[T] =
    TimeSeries
      .splitEntriesLongerThan(entries, entryMaxLength)
      // we don't want to compress the consecutive equal entries that result from
      // splitting a long entry up
      .foldLeft(newBuilder[T](compress = false))(_ += _)
      .result()

  /** Compute a new time series that will contain, for any query time t, the integral
   * over the entries present in this time series that are defined for a time
   * between t - window and t.
   *
   * Note: returns a step function, meaning that there is a slight level of
   * imprecision depending on your resolution. The bigger the window is relative to
   * the sampleRate, the smaller the imprecision becomes.
   *
   * @param window   width of the window
   * @param timeUnit time unit used for this entry. By default, milliseconds are assumed.
   * @param sampleRate frequency of resampling
   * @return a TimeSeries that for any queried time will return an approximate integral of
   *         this time series over the past window
   */
  def slidingIntegral[U >: T](
    window: Long,
    sampleRate: Long,
    timeUnit: TimeUnit = TimeUnit.MILLISECONDS
  )(implicit n: Numeric[U]): TimeSeries[Double] =
    NumericTimeSeries
      .slidingIntegral[U](this.entries, window, sampleRate, timeUnit)
      .foldLeft(newBuilder[Double]())(_ += _)
      .result()

  /** Slides a window of size 'windowWidth' over the entries present in this series.
   * It calculates some aggregate on each window that does not depend on the time of
   * validity of the entries. As the given aggregator is reversible this can be done
   * efficiently.
   *
   * Each returned entry E is calculated from the entries of the original time
   * series that intersect with any window that ends in the domain of E.
   *
   * @note The difference between [[rollup()]] and [[slidingWindow()]] is that
   * rollup generates disjoint slices of the time series and aggregates over those,
   * whereas for sliding window an entry can be part of multiple windows.
   *
   * @param windowWidth width of the window
   * @param aggregator a reversible aggregator to efficiently compute aggregations over the window
   * @return a new series contianing all the aggregates as entries
   */
  def slidingWindow[U >: T, A](
    windowWidth: Long,
    aggregator: TimeUnawareReversibleAggregator[U, A]
  ): TimeSeries[A] =
    aggregateStreamToSeries(
      WindowSlider.window(this.entries.toStream, windowWidth, aggregator)
    )

  /** See [[slidingWindow()]]. This function slides a window and uses a time-aware
   * aggregator, i.e. the aggregated values can depend on the duration of validity
   * of each entry (example: average weighted by time of validity). Therefore it
   * samples the entries first.
   *
   * @param sampleRate to resample the entries
   * @param useClosestInWindow whether to sample strictly or not (see [[TimeSeries.sample()]])
   */
  def slidingWindow[U >: T, A](
    windowWidth: Long,
    aggregator: TimeAwareReversibleAggregator[U, A],
    sampleRate: Long,
    useClosestInWindow: Boolean = true
  ): TimeSeries[A] =
    aggregateStreamToSeries(
      WindowSlider.window(this.entries.toStream, windowWidth, aggregator, sampleRate, useClosestInWindow)
    )

  private def aggregateStreamToSeries[A](seq: Seq[(TSEntry[_], Option[A])]): TimeSeries[A] =
    seq.flatMap {
      // Drop the content of the window, just keep the aggregator's result.
      case (entry, aggregateOpt) => aggregateOpt.map(a => entry.map(_ => a))
    }.foldLeft(newBuilder[A]())(_ += _)
      .result()

  /** Sample this TimeSeries at fixed time intervals of length sampleRate starting at
   * the start timestamp. By default, all resulting entries will have the duration
   * of sampleRate. If equal contiguous entries are compressed (set the compress flag)
   * all entries have a duration that is a multiple of sampleRate.
   *
   * In the strict mode (useClosestInWindow = false), the sampled values are exactly
   * equal to the value of this TimeSeries at the sample points. In the
   * useClosestInWindow mode, the sampling looks at the entries in the window of
   * `[samplePoint - sampleRate/2, samplePoint + sampleRate/2[`. The value of the
   * entry that starts the closest to the samplePoint among those starting in the
   * window is taken.
   *
   * @note In either case, this function does **not** perform any kind of
   *       aggregation or roll-up.
   * @param start              timestamp of first sample point
   * @param sampleRate         interval between sample points
   * @param useClosestInWindow enables non-strict look-around sampling
   * @param compress           specifies whether equal contiguous entries should be compressed
   * @return the sampled time series
   */
  def sample(start: Long, sampleRate: Long, useClosestInWindow: Boolean, compress: Boolean = false): TimeSeries[T] =
    TimeSeries
      .sample(this.entries, start, sampleRate, useClosestInWindow)
      .foldLeft(newBuilder[T](compress))(_ += _)
      .result()

  /**
   * Buckets this TimeSeries into sub-time series that have a domain of definition that is at most that
   * specified by the passed bucket boundaries.
   *
   * @param buckets a stream of times representing bucket boundaries. A stream of (a, b, c, ...)
   *                will generate buckets with domain (([a, b[), ([b, c[), ...)
   *                Note that it is wise to have 'buckets' start at a meaningfully close point in time
   *                relative to the time series first entry.
   * @return a stream of (bucket-start, time series).
   */
  def bucket(buckets: Stream[Long]): Stream[(Long, TimeSeries[T])] =
    TimeBucketer.bucketEntriesToTimeSeries(buckets, this.entries, newBuilder[T]())

  /** Given the passed bucket delimiters, apply 'aggregator' for each generated bucket.
   *
   * Note that the timestamps and validities of the entries present in the returned
   * time series are ONLY driven by the boundaries generated by 'buckets': the first
   * and last entry may well be defined outside of the domain of definition of this
   * time series.
   *
   * @note The difference between [[rollup()]] and [[slidingWindow()]] is that
   * rollup generates disjoint slices of the time series and aggregates over those,
   * whereas for sliding window an entry can be part of multiple windows.
   *
   * @param buckets a stream generating the bucket boundaries for the rollup/aggregation
   * @param aggregator a function that computes an aggregate over a time series
   * @tparam R the type returned by the aggregator
   * @return a TimeSeries, the values of which are generated by the aggregator and the entries' domains
   *         are defined by the respective buckets.
   */
  def rollup[R](buckets: Stream[Long], aggregator: TimeSeries[T] => R): TimeSeries[R] =
    bucket(buckets)
    // Slide so that we may have the end of the bucket in context
      .sliding(2)
      // Build a (bucketStart, bucketEnd, relevantValue) triple
      .map(pair => (pair.head._1, pair.tail.head._1, aggregator(pair.head._2)))
      .foldLeft(newBuilder[R]())((accum, triple) => accum += TSEntry(triple._1, triple._3, triple._2 - triple._1))
      .result()

  /**
   * Returns the bounds of the domain
   *
   * If the time series does not contain any "hole" in its domain, then the loose domain is equal to
   * its domain. Otherwise, the loose domain only contains the min/max bounds of the domain.
   *
   * Said otherwise, the time series is guaranteed to be undefined outside of the loose domain, and
   * has at least a point where it is defined within the loose domain.
   *
   * @return The oldest and newest timestamps where the time series is defined, encapsulated in a `LooseDomain`
   */
  def looseDomain: TimeDomain

  /**
   * Fallback to `other` when `this` is not defined
   *
   * @param other Another time series which should contain the value when `this` is not defined
   * @tparam U The new underlying parameter
   * @return A time series which contains the values of `this` if defined, and of `other` otherwise
   */
  def fallback[U >: T](other: TimeSeries[U]): TimeSeries[U] =
    merge[U, U] {
      case (Some(v), _)    => Some(v)
      case (_, otherValue) => otherValue
    }(other)

  /**
   * @return The probability that the time series is defined over its loose-domain
   */
  def supportRatio: Double

  /** Returns true if it is guaranteed that this timeseries is defined for all t in its looseDomain.
   * I. e. whether there are holes in its time domain or not.  If this returns false it is not
   * known whether the series has been compressed.
   */
  def isDomainContinuous: Boolean

  /**
   * @return a builder that constructs a new timeseries of this implementation
   */
  def newBuilder[U](compress: Boolean = true)(implicit tag: WeakTypeTag[U]): TimeSeriesBuilder[U] =
    TimeSeries.newBuilder(compress)
}

object TimeSeries {

  /** For any collection of TSEntries of size 2 and more, intersperses entries containing
   * fillValue between any two non-contiguous entries.
   *
   * Assumes the passed entries to be both properly fitted (no overlapping domains) and
   * compressed (no contiguous entries containing the same value).
   *
   * The result will be properly fitted and compressed as well.
   */
  def fillGaps[T](in: Seq[TSEntry[T]], fillValue: T): Seq[TSEntry[T]] =
    TimeSeries.ofOrderedEntriesUnsafe(in).fill(fillValue).entries

  /** @see [[TimeSeriesMerger.mergeEntries]] */
  def mergeEntries[A, B, C](a: Seq[TSEntry[A]])(b: Seq[TSEntry[B]])(op: (Option[A], Option[B]) => Option[C]): Seq[TSEntry[C]] =
    TimeSeriesMerger.mergeEntries(a, b, compress = true)(op)

  /**
   * Groups the entries in the stream into substreams that each contain at most
   * maxNumberOfEntries.
   *
   * @param entries            as a stream
   * @param maxNumberOfEntries contained by each substream of the result
   * @return a stream of (bucket-start, bucket-entries)
   */
  def groupEntries[T](
    entries: Stream[TSEntry[T]],
    maxNumberOfEntries: Int
  ): Stream[(Long, Stream[TSEntry[T]])] =
    entries
      .grouped(maxNumberOfEntries)
      .toStream
      .map(substream => (substream.head.timestamp, substream))

  /**
   * Splits up all entries in the input that are longer than the given maximal length.
   *
   * @param entryMaxLength to use for splitting
   * @return a sequence of entries guaranteed to be shorter than the given
   *         maximal length
   */
  def splitEntriesLongerThan[T](entries: Seq[TSEntry[T]], entryMaxLength: Long): Seq[TSEntry[T]] =
    entries.flatMap(entry => entry.splitEntriesLongerThan(entryMaxLength).entries)

  /** See [[TimeSeries.sample()]] in the trait. Implements the sampling on a stream
   * of entries with lazy stream evaluation.
   */
  def sample[T](
    entries: Seq[TSEntry[T]],
    start: Long,
    sampleRate: Long,
    useClosestInWindow: Boolean
  ): Seq[TSEntry[T]] = {

    @inline
    def tooFarToTake(next: TSEntry[_], samplePoint: Long): Boolean =
      if (useClosestInWindow) next.timestamp > samplePoint + sampleRate / 2
      else next.timestamp > samplePoint

    def rec(samplePoint: Long, remaining: Stream[TSEntry[T]]): Stream[TSEntry[T]] =
      remaining match {
        case Stream() => Stream()

        // The next entry is still too far away, we just go to the next sample point.
        case next +: _ if tooFarToTake(next, samplePoint) =>
          rec(samplePoint + sampleRate, remaining)

        // We take the value of the current entry if:
        case current +: next +: _
            // In strict mode, we only take the value if it is defined at the sample point.
            if !useClosestInWindow && samplePoint < current.definedUntil

            // In useClosest mode we take the currently defined value if the next.
            // entry is out of the window
              || useClosestInWindow && (
                  samplePoint < current.definedUntil && next.timestamp > samplePoint + sampleRate / 2

                  // But we also take the value if its start is closer to the next's start.
                    || Math.abs(current.timestamp - samplePoint) < Math.abs(next.timestamp - samplePoint)
                ) =>
          TSEntry(samplePoint, current.value, sampleRate) #:: rec(samplePoint + sampleRate, remaining)

        // For the last entry, we only take its value if it is still defined
        // at the sample point.
        case Seq(last) if samplePoint < last.definedUntil =>
          TSEntry(samplePoint, last.value, sampleRate) #:: rec(samplePoint + sampleRate, remaining)

        // Otherwise, we can't use the current entry anymore and drop it.
        case _ => rec(samplePoint, remaining.tail)
      }

    rec(start, entries.toStream)
  }

  /**
   * Computes the union of the passed time series' loose domains
   *
   * @param tss A sequence of time series
   * @tparam T The underlying type of the time series
   * @return The union of the LooseDomains
   */
  def unionLooseDomains[T](tss: Seq[TimeSeries[T]]): TimeDomain =
    tss.map(_.looseDomain).fold(EmptyTimeDomain)(_.looseUnion(_))

  /**
   * Computes the intersection of the passed time series' loose domains
   *
   * @note If there is an empty time series, then the intersection will be None.
   * @param tss A sequence of time series
   * @tparam T The underlying type of the time series
   * @return The intersection of the LooseDomains
   */
  def intersectLooseDomains[T](tss: Seq[TimeSeries[T]]): TimeDomain =
    if (tss.isEmpty) {
      EmptyTimeDomain
    } else {
      tss.map(_.looseDomain).reduce(_.intersect(_))
    }

  /**
   * Construct a time series using an ordered Seq of TSEntries
   *
   * The correct underlying implementation will be used depending of the Seq's size
   * (i.e. EmptyTimeSeries, TSEntry, or a VectorTimeSeries)
   *
   * @note The sequence has to be chronologically ordered, otherwise the time series might
   *       not behave correctly. In general, you should use a `TimeSeries.newBuilder`. Furthermore, no
   *       two entries should have the same timestamp. Finally, entries will NOT be compressed.
   * @param xs                A sequence of TSEntries which HAS to be chronologically ordered (w.r.t. their timestamps) and
   *                          well-formed (no duplicated timestamps)
   * @param isCompressed      Flags whether the xs' have been compressed in their construction.
   *                          Will be passed to the underlying implementation.
   * @param isDomainContinuous Flags whether all the entries span a continuous time domain without holes.
   *                          Will be passed to the underlying implementation.
   * @tparam T The underlying type of the time series
   * @return A time series with a correct implementation
   */
  def ofOrderedEntriesUnsafe[T](
    xs: Seq[TSEntry[T]],
    isCompressed: Boolean = false,
    isDomainContinuous: Boolean = false
  ): TimeSeries[T] = {
    val size = xs.size

    if (size == 0) {
      EmptyTimeSeries
    } else if (size == 1) {
      xs.head
    } else {
      VectorTimeSeries.ofOrderedEntriesUnsafe(xs, isCompressed, isDomainContinuous)
    }
  }

  /**
   * Construct using a time series `TimeSeriesBuilder` given an ordered list of entries
   *
   * The correct underlying implementation will be chosen (EmptyTimeSeries, TSEntry or VectorTimeSeries).
   * As we are using a `TimeSeriesBuilder`, the entries will be compressed if possible.
   *
   * @note No two entries can have the same timestamp, an exception will be thrown if it's the case.
   * @param xs       A sequence of TSEntries which HAS to be chronologically ordered (w.r.t. their timestamps) and
   *                 well-formed (no duplicated timestamps)
   * @param compress A flag specifying whether the entries should be compressed or not.
   * @tparam T The underlying type of the time series
   * @return A compressed time series with a correct implementation
   */
  def ofOrderedEntriesSafe[T](xs: Seq[TSEntry[T]], compress: Boolean = true): TimeSeries[T] =
    xs.foldLeft(newBuilder[T](compress))(_ += _).result()

  /**
   * An safe constructor of `TimeSeries`
   *
   * The given entries are sorted, compressed (if needed) and returned as a time series. If the sequence
   * is empty, then it returns an `EmptyTimeSeries`. If the sequence is made of only one entry, then it returns
   * it.
   *
   * @note All entries should have different timestamps.
   * @param entries A sequence of entries which all have a different timestamp
   * @tparam T The time series' underlying parameter
   * @return A well initialized time series
   */
  def apply[T](entries: Seq[TSEntry[T]]): TimeSeries[T] = ofOrderedEntriesSafe(entries.sorted)

  /**
   * @return the default timeseries builder implementation
   */
  def newBuilder[T](compress: Boolean = true): TimeSeriesBuilder[T] = new VectorTimeSeries.Builder[T](compress)
}