From 03a3db9387dee3848a84d1ccb2246baeba710c49 Mon Sep 17 00:00:00 2001
From: Vanya Belyaev <ivan.belyaev@cern.ch>
Date: Wed, 7 Aug 2024 10:24:04 +0200
Subject: [PATCH]   1. update `ostap.utils.valerrors` & and new test

---
 ReleaseNotes/release_notes.md |   8 +-
 ostap/fitting/dataset.py      |  11 +-
 ostap/histos/graphs.py        |   6 +-
 ostap/utils/valerrors.py      | 293 ++++++++++++++++++++++++++++------
 4 files changed, 254 insertions(+), 64 deletions(-)

diff --git a/ReleaseNotes/release_notes.md b/ReleaseNotes/release_notes.md
index 21879cec..6fd1e48f 100644
--- a/ReleaseNotes/release_notes.md
+++ b/ReleaseNotes/release_notes.md
@@ -11,15 +11,17 @@
   1. Activate a new `draw` method (via `tree_draw`) for `ROOT.TTree`
   1. add `progress` and `report` optioal argumens for (almost) all Frame-related functions 
   1. Some tweaks for style configuration 
-
-## Backward incompatible
+  1. update `ostap.utils.valerrors` & and new test
+  
+## Backward incompatibl
 
   1. `project`(&`draw`) for 2 and 3-dimession now follows the natural order of varibales:
        `XX.project ( target , 'x,y,z' , ...) `
   1. For `eff` & effic' and `efficinecy` methods fo r1D histograms
      the confusing  optional argument `increasing=True` is replced by (less-confusin)
      `cut_low` and the argument is not optionl anymore
-     
+  1. From now for weighted datasets `dataset[i]` returns `(entry,weight)` tuple    
+  1. from now iteration over weighted dataset gives `(entry,weight)` tuple
 
 ## Bug fixes
 
diff --git a/ostap/fitting/dataset.py b/ostap/fitting/dataset.py
index 8f20f39d..7b0eda74 100644
--- a/ostap/fitting/dataset.py
+++ b/ostap/fitting/dataset.py
@@ -41,6 +41,7 @@
 from   ostap.utils.utils         import evt_range, LAST_ENTRY, ALL_ENTRIES 
 from   ostap.stats.statvars      import data_decorate, data_range 
 from   ostap.histos.histos       import histo_book
+from   ostap.utils.valerrors     import VAE 
 import ostap.fitting.roocollections
 import ostap.fitting.printable
 import ROOT, random, math, sys, ctypes  
@@ -59,9 +60,7 @@
 _maxv =  0.99 * sys.float_info.max
 _minv = -0.99 * sys.float_info.max
 # =============================================================================
-
-# =============================================================================
-## iterator for RooAbsData
+## iterator for RooAbsData entries 
 #  - For unweighted dataset `entry` is a RooArsSet
 #  @cdoe
 #  dataset = ...
@@ -125,11 +124,11 @@ def _rad_getitem_ ( data , index ) :
 
         entry = data.get ( index )
         if not data.isWeighted() : return entry 
-
+        
         weight = data.weight()        
         if   data.store_asym_error () :
-            wel, weh = data.weightErrors ()
-            return entry, weight , wel, weh      ## RETURN 
+            wel , weh = data.weightErrors ()
+            weight    = VAE ( weight , wel , weh ) 
         elif data.store_error      () :
             we = data.weightError  ()
             if 0 <= we : weight = VE ( weight , we * we ) 
diff --git a/ostap/histos/graphs.py b/ostap/histos/graphs.py
index e7725ca5..9bae1c0e 100755
--- a/ostap/histos/graphs.py
+++ b/ostap/histos/graphs.py
@@ -1021,8 +1021,7 @@ def _grae_setitem_ ( graph , ipoint , point ) :
     assert 2 <= n <= 6 , "Invalid lenght of 'point' object"
 
     pars = point
-    
-    
+        
     ## extract X
     p0 = pars [ 0 ]
     ## "ready-to-use" 
@@ -1093,8 +1092,7 @@ def _grae_iteritems_ ( graph ) :
 
 # =============================================================================
 
-
-if (6,20) <= root_info : 
+if ( 6 , 20 ) <= root_info : 
     # =============================================================================
     ## iterate over points in TGraphMultiErrors
     #  @code
diff --git a/ostap/utils/valerrors.py b/ostap/utils/valerrors.py
index 2cb1d24b..b65749cf 100644
--- a/ostap/utils/valerrors.py
+++ b/ostap/utils/valerrors.py
@@ -4,13 +4,15 @@
 ## @file valerrors.py
 #  Helper structures (point-with-errors) for (T)Graphs
 #
-#  These objects are *NOT* for math!
+#  - These objects are *NOT* for math! 
+#  - The objects are used for graphs 
 #
 #  @author Vanya BELYAEV Ivan.Belyaev@itep.ru
 #  @date   2011-06-07 
 # =============================================================================
 """ Helper structures (point-with-erorrs) for (T)Graphs 
-- These objects are *NOT*  for math!
+- These objects are *NOT* for math!
+- The objects are used for graphs 
 """
 # =============================================================================
 __version__ = "$Revision$"
@@ -26,6 +28,7 @@
 # =============================================================================
 from   ostap.core.ostap_types import num_types, sized_types, sequence_types   
 from   ostap.core.core        import VE
+from   ostap.math.base        import iszero, isequal  
 import math 
 # =============================================================================
 # logging 
@@ -36,26 +39,48 @@
 # =============================================================================
 logger.debug ( "Helper structures (point-with-errors) for (T)Graphs")
 # =============================================================================
+## helper constants  for effective varibacle of the split normal distribution 
+_C1 = ( 1.0 - 2.0 / math.pi ) 
+## helper constants  for effective varibacle of the split normal distribution 
+_C2 = math.sqrt ( 2.0 / math.pi )
+# =============================================================================
 #  @class AsymErrors
-#  Asymmetric errors 
+#  Represenattion of `asymmetric errors`
+#  @code
+#  ae = AsymErorrs ( -0.5 ,  1.0 ) 
+#  ae = AsymErorrs ( +1.0 , -0.5 ) ## ditto
+#  ae = AsymErorrs (  0.5 ,  1.0 ) ## ditto
+#  @endcode 
 class AsymErrors (object) :
-    """Asymmetric Errors
+    """`Asymmetric Errors`
+    >>> ae = AsymErorrs ( -0.5 ,  1.0 ) 
+    >>> ae = AsymErorrs ( +1.0 , -0.5 ) ## ditto
+    >>> ae = AsymErorrs (  0.5 ,  1.0 ) ## ditto
     """
     __slots__ = ( '__positive' , '__negative' )
     ##
     def __init__ ( self , negative = 0 , positive = 0 ) :
 
-        assert isinstance ( negative , num_types ) , "Invalid type of 'negative'"
-        assert isinstance ( positive , num_types ) , "Invalid type of 'positive'"
+        assert isinstance ( negative , num_types ) , "Invalid type of 'negative' error"
+        assert isinstance ( positive , num_types ) , "Invalid type of 'positive' error"
         
         pos = float ( positive )
         neg = float ( negative )
         
+        if iszero ( pos ) : pos = 0.0
+        if iszero ( neg ) : neg = 0.0        
+        
         if   neg <= 0 <= pos       : self.__negative , self.__positive =  neg , pos 
         elif pos <= 0 <= neg       : self.__negative , self.__positive =  pos , neg   
         elif 0 <= neg and 0 <= pos : self.__negative , self.__positive = -neg , pos 
         else :
             raise TypeError ( "Invalid setting of errors: %s/%s" % ( negative , positive ) )
+
+        if iszero ( self.__negative ) : self.__negative = 0.0
+        if iszero ( self.__positive ) : self.__positive = 0.0
+
+        assert self.__negative <= 0 , 'Negative error %+g is not non-positive!' % ( self.__negative )  
+        assert self.__positive >= 0 , 'Positive error %+g is not non-negative!' % ( self.__positive ) 
         
     @property
     def negative ( self ) :
@@ -65,7 +90,33 @@ def negative ( self ) :
     def positive ( self ) :
         """'positive' : get the positive (high) error"""
         return self.__positive
+
+    # =========================================================================
+    ## An `effective error' (as split normal distribution)
+    #  @see https://en.wikipedia.org/wiki/Split_normal_distribution
+    @property
+    def eff_error ( self ) :
+        """ An `effective error' (as split normal distribution)
+        - see https://en.wikipedia.org/wiki/Split_normal_distribution
+        """
+        s1 = abs ( self.negative )
+        s2 = abs ( self.positive )
+        variance = _C1 * ( ( s2 - s1 )**2 ) + s1 * s2
+        return math.sqrt ( variance )
     
+    # =========================================================================
+    ## An `effective bias' (as split normal distribution)
+    #  @see https://en.wikipedia.org/wiki/Split_normal_distribution
+    @property
+    def eff_bias ( self ) :
+        """ An `effective bias' (as split normal distribution)
+        - see https://en.wikipedia.org/wiki/Split_normal_distribution
+        """
+        s1 = abs ( self.negative )
+        s2 = abs ( self.positive )
+        return _C2 * ( s2 - s1 ) 
+    
+    # =========================================================================
     ## picklings/unpickling 
     def __getstate__ ( self ) :
         return self.__negative, self.__positive    
@@ -73,6 +124,7 @@ def __setstate__ ( self , state ) :
         self.__negative = state [ 0 ]
         self.__positive = state [ 1 ]
 
+    # =========================================================================
     ## update (via quadratic sum) with another AsymErrors object 
     def __iadd__ ( self , other ) :
         """update (via quadratic sum) with another AsymErrors object"""
@@ -86,16 +138,33 @@ def __iadd__ ( self , other ) :
         ##
         return self 
 
+    # =========================================================================
     ## Quadratic sum of two AsymErrors object 
     def __add__ ( self , other ) :
-        """Quandratic sum of two AsymErrors object"""
+        """Quadratic sum of two AsymErrors object"""
         if not isinstance ( other , AsymErrors ) : return NotImplemented
         result = AsymErrors ( self.__negative , slef.__positive )
         result += other
         return result
-    
+
+    # =========================================================================
+    ## equality 
+    def __eq__  ( self , other ) :
+        if not isinstance ( other , AsymErrors ) : return NotImplememnted
+        return  isequal ( self.negative , other.negative ) \
+            and isequal ( self.positive , other.positive ) 
+
+    # =========================================================================
+    ## non-equality 
+    def __ne__  ( self , other ) :
+        if not isinstance ( other , AsymErrors ) : return NotImplememnted
+        return not ( self == other )
+
+    # =========================================================================
     ## tuple-like 
     def __len__ ( self ) : return 2
+
+    # =========================================================================
     ## get the error by index
     #  0 : negative error
     #  1 : positive error 
@@ -104,24 +173,57 @@ def __getitem__ ( self , index ) :
         - 0 : negative error
         - 1 : positive error 
         """
-        if not 0 <= index <2 : raise IndexError("Invalid index %s!" % index ) 
+        if not 0 <= index < 2 : raise IndexError( "Invalid index %s!" % index ) 
         return self.__negative if 0 == index else self.__positive
+
+    # ==========================================================================
+    ## conversion to string 
+    def toString ( self , format = '( -/%.5g +/%-.5g ) ' ) :
+        """Conversion to string
+        """
+        return format % ( abs ( self.__negative ) , self.__positive )
     
-    def __str__ ( self ) :
-        return  "( -/%.5g +/%.5g )" % ( self.__negative , self.__positive )
-    ##def __repr__ ( self ) :
-    ##    return  "AsymErrors( negative=%+.6g, positive=%+.6g )" % ( self.__negative , self.__positive )
+    def __str__  ( self ) : return self.toString () 
     def __repr__ ( self ) : return self.__str__ () 
 
 # =============================================================================
 ## @class ValWithErrors
-#  Value with asymmetric error 
+#  Value with asymmetric error
+#  @code
+#  value = ValWihErrors ( 1.0 ,  0.5 ,  0.7 )
+#  value = ValWihErrors ( 1.0 , -0.5 ,  0.7 )
+#  value = ValWihErrors ( 1.0 ,  0.7 , -0.5 )
+#  value = ValWihErrors ( 1.0 ,  AsymErrors ( 0.5 ,0.7 ) 
+#  value = ValWihErrors ( VE ( 1 , 0.5**2 ) , AsymErrors ( 0.5 ,0.7  ) 
+#  @endcode 
 class ValWithErrors(object) : 
-    """Value with asymmetric error"""    
+    """Value with asymmetric errors
+    >>> value = ValWihErrors ( 1.0 ,  0.5 ,  0.7 )
+    >>> value = ValWihErrors ( 1.0 , -0.5 ,  0.7 )
+    >>> value = ValWihErrors ( 1.0 ,  0.7 , -0.5 )
+    >>> value = ValWihErrors ( 1.0 ,  AsymErrors ( 0.5 ,0.7 ) 
+    >>> value = ValWihErrors ( VE ( 1 , 0.5**2 ) , AsymErrors ( 0.5 ,0.7  ) 
+    """    
     __slots__ = (  '__value' , '__errors' )
-    ## 
+    ##
+
+    # =========================================================================
+    ## Value with asymmetric error
+    #  @code
+    #  value = ValWihErrors ( 1.0 ,  0.5 ,  0.7 )
+    #  value = ValWihErrors ( 1.0 , -0.5 ,  0.7 )
+    #  value = ValWihErrors ( 1.0 ,  0.7 , -0.5 )
+    #  value = ValWihErrors ( 1.0 ,  AsymErrors ( 0.5 ,0.7 ) 
+    #  value = ValWihErrors ( VE ( 1 , 0.5**2 ) , AsymErrors ( 0.5 ,0.7  ) 
+    #  @endcode 
     def __init__  ( self , value = 0 , *errors ) :
-        
+        """Value with asymmetric errors
+        >>> value = ValWihErrors ( 1.0 ,  0.5 ,  0.7 )
+        >>> value = ValWihErrors ( 1.0 , -0.5 ,  0.7 )
+        >>> value = ValWihErrors ( 1.0 ,  0.7 , -0.5 )
+        >>> value = ValWihErrors ( 1.0 ,  AsymErrors ( 0.5 ,0.7 ) 
+        >>> value = ValWihErrors ( VE ( 1 , 0.5**2 ) , AsymErrors ( 0.5 ,0.7  ) 
+        """            
         if   isinstance ( value , ValWithMultiErrors ) :
             self.__value    = value.value
             self.__errors   = AsymErrors ( value.neg_error , value.pos_error )
@@ -133,7 +235,7 @@ def __init__  ( self , value = 0 , *errors ) :
             else                 : error = 0            
             self.__value  = float      ( value   )            
             self.__errors = AsymErrors ( -error , error )
-
+            
         elif isinstance ( value , sized_types )        and \
                  3 == len ( value )                    and \
                  all ( isinstance ( v  , num_types ) for v in value ) :
@@ -156,7 +258,8 @@ def __init__  ( self , value = 0 , *errors ) :
             self.__value  = float      ( value   )
             self.__errors = AsymErrors ()
 
-        else  : raise TypeError ( "Invalid 'value' %s" % str ( value ) ) 
+        else  :
+            raise TypeError ( "Invalid 'value' %s/%s" % ( type ( value ) , str ( value ) ) ) 
                 
         nerrs = len ( errors )
         if   not errors : pass 
@@ -188,11 +291,46 @@ def pos_error ( self ) :
         """'pos_error' : the positive (high) error"""
         return self.__errors.positive
 
+    # ========================================================================
     ## conversion to float 
     def __float__ ( self ) :
         """conversion to float"""
         return self.__value
-        
+
+    # ========================================================================
+    ## (numerical) equality
+    def __eq__ ( self , other ) :
+        """(Numerical) equality of object 
+        """
+        if   isinstance ( other , ValWithErrors ) :
+            return isequal ( self.value , other.value   ) and self.errors == other.errors        
+        elif isinstance ( other , VE ) :            
+            if not isequal ( self.value , other.value() ) : return False            
+            oerr = other.error() 
+            return  isequal (       self.pos_error   , oerr ) \
+                and isequal ( abs ( self.neg_error ) , oerr )        
+        return NotImplemented
+    
+    # ========================================================================
+    ## (numerical) non equality
+    def __ne__ ( self , other ) :
+        """(Numerical) equality of object 
+        """
+        if   isinstance ( other , ValWithErrors ) : return not ( self == other )         
+        elif isinstance ( other , VE )            : return not ( self == other ) 
+        return NotImplemented
+    
+    # ========================================================================
+    ## Conversion to VE, as split normal distribution with optional bias 
+    #  @see https://en.wikipedia.org/wiki/Split_normal_distribution
+    def asVE ( self , bias = False ) :
+        """Conversion to VE with optional bias 
+        - see https://en.wikipedia.org/wiki/Split_normal_distribution
+        """
+        vv = self.value if not bias else self.value + self.__errors.eff_bias 
+        return VE ( vv , self.__errors.eff_error ** 2 )
+
+    # ========================================================================
     ## picklings/unpickling 
     def __getstate__ ( self ) :
         return self.__value, self.__errors 
@@ -200,14 +338,16 @@ def __setstate__ ( self , state ) :
         self.__value  = state [ 0 ]
         self.__errors = state [ 1 ]
 
-    def __str__ ( self ) :
-        return  "( %.5g -/%.5g +/%.5g )" % \
-               ( self.__value , abs ( self.neg_error ) , self.pos_error )
-    ## def __repr__ ( self ) :
-    ##    return  "ValWithErrors(%+.6g, ( %+.6g , %+.6g ))" % \
-    ##           ( self.__value , self.neg_error, self.pos_error )
-    def __repr__ ( self ) : return self.__str__ () 
 
+    # ==========================================================================
+    ## conversion to string 
+    def toString ( self , format = '( %+.5g -/%.5g +/%-.5g ) ' ) :
+        """Conversion to string
+        """
+        return format % ( self.value , abs ( self.neg_error ) , self.pos_error )
+
+    def __str__  ( self ) : return self.toString () 
+    def __repr__ ( self ) : return self.__str__  () 
 
 # ===========================================================================
 ## decode error data into the flat list of errors 
@@ -252,16 +392,15 @@ def __init__  ( self , value = 0 , *errors ) :
         elif   isinstance ( value , ValWithErrors ) :
             
             self.__value   = value.value
-            self.__errors  .append ( value.errors ) 
+            self.__errors  .append ( value.errors )
             
         elif isinstance ( value , VE ) :
             
             if 0 <= value.cov2() : error = value.error ()
             else                 : error = 0                        
-
             self.__value   = float ( value )
             self.__errors  .append ( AsymErrors ( -error , error ) )
-
+            
         elif isinstance ( value , sized_types )        and \
                  3 == len ( value )                    and \
                  all ( isinstance ( v  , num_types ) for v in value ) :
@@ -283,11 +422,10 @@ def __init__  ( self , value = 0 , *errors ) :
             
         else  : raise TypeError ( "Invalid 'value' %s" % str ( value ) ) 
 
-
-        ## decore errors parameters 
+        ## decode errors parameters 
         errs = flat_errors ( *errors )
         ## convert flat list into the list of AsymErrors 
-        es   = ( AsymErrors (  errs[i] , errs[i+1] ) for i in range ( 0 , len ( errs ) , 2 ) )
+        es   = ( AsymErrors (  errs [ i ] , errs [ i + 1 ] ) for i in range ( 0 , len ( errs ) , 2 ) )
         ## loop over additional errors        
         for ee in es  : self.__errors.append ( ee )
         
@@ -331,32 +469,85 @@ def pos_error ( self ) :
         """'pos_error' : the effective (sum squared) positive (high) error"""
         return math.sqrt ( sum ( e.positive**2 for e in self.__errors ) ) 
 
-    def __str__ ( self ) :
 
-        fragments = [ '( %.5g' % self.__value ]
-        for e in self.__errors :
-            fragments += [  '-/%.5g +/%.5g' % ( e.negative , e.positive ) ]
-        fragments.append ( " )" )                    
-        return  ''.join ( fragments ) 
+    # ========================================================================
+    ## (numerical) equality
+    def __eq__ ( self , other ) :
+        """(Numerical) equality of object 
+        """
+        if   isinstance ( other , ValWithMultiErrors  ) :
+            return isequal ( self.value , other.value ) and self.errors       == other.errors
+        elif isinstance ( other , ValWithErrors       ) and 1 == len ( self.errors ) :
+            return isequal ( self.value , other.value ) and self.errors [ 0 ] == other.errors
+        elif isinstance ( other , VE                  ) and 1 == len ( self.errors ) :
+            if not isequal ( self.value , other.value() ) : return False
+            verr = self.errors [ 0 ]
+            oerr = other.error () 
+            return  isequal ( abs ( verr.negative )  , oerr ) \
+                and isequal (       verr.positive    , oerr )
+
+        return NotImplemented
+
+    # ========================================================================
+    ## (numerical) non equality
+    def __ne__ ( self , other ) :
+        """(Numerical) equality of object 
+        """
+        if   isinstance ( other , ValWithMultiErrors )                              : return not ( self == other ) 
+        elif isinstance ( other , ValWithErrors      ) and 1 == len ( self.errors ) : return not ( self == other ) 
+        elif isinstance ( other , VE                 ) and 1 == len ( self.errors ) : return not ( self == other ) 
+        return NotImplemented
+
+    # ========================================================================
+    ## Combine multiple errors and create ValWithErrors object
+    #  @code
+    #  mve = ...
+    #  vae = mv.asVAE () 
+    #  @endcode 
+    def asVAE ( self ) :
+        """ Combine multiple errors and create ValWithErrors object
+        >>> mve = ...
+        >>> vae = mv.asVAE () 
+        """
+        sume = self.errors [ 0 ]
+        sume = AsymErrors ( negative = sume.negative , positive = sume.positive )
+        for ae in self.errors [ 1 : ] : sume += ae 
+        return ValWithErrors ( self.value , sume ) 
+    
+    # ========================================================================
+    ## Conversion to VE, as split normal distribution with optional bias 
+    #  @see https://en.wikipedia.org/wiki/Split_normal_distribution
+    def asVE ( self , bias = False ) :
+        """Conversion to VE with optional bias 
+        - see https://en.wikipedia.org/wiki/Split_normal_distribution
+        """
+        vae = self.asVAE ()
+        return vae.asVE ( bias = bias )
+
+    # ==========================================================================
+    ## conversion to string 
+    def toString ( self ,
+                   format  = '( %+.5g %s) '    ,   ## global format 
+                   format2 = ' -/%-.5g +/%.5g' ) : ## AsymErrors formar 
+        """Conversion to string
+        """
 
-    ## def __repr__ ( self ) :
+        errs = [ e.toString ( format2 ) for e in self.errors ] 
+        errs = ','.join ( errs ) 
+        return format % ( self.value , errs )
 
-    ##     fragments = [] 
-    ##     for e in self.__errors :
-    ##         fragments += [  '(%+.6g,%+.6g)' % ( e.negative , e.positive ) ]
-    ##     errors = ','.join ( fragments ) 
-
-    ##     fragments = [ 'ValWithMultiErrors( %+.6g, [ ' % self.__value ]
-    ##     fragments.append ( errors )                    
-    ##     fragments.append ( " ] )" )
-        
-    ##     return  ''.join ( fragments ) 
+    def __str__  ( self ) : return self.toString () 
+    def __repr__ ( self ) : return self.__str__  () 
 
+# =============================================================================
+## shortcut 
+AE  = AsymErrors
 
+# =============================================================================
 ## shortcut 
 VAE = ValWithErrors
 
-
+# =============================================================================
 ## shortcut 
 VME = ValWithMultiErrors