Module `ambit_stochastics.trawl`

A container class for the simulation, parameter inference and forecasting of trawl processes $X_t = L(A_t)$ .

Expand source code

"""A container class for the simulation, parameter inference and forecasting of trawl processes \(X_t = L(A_t)\)."""
################## module imports ##################
from scipy.signal import convolve2d 
from scipy.integrate import quad
#from numba import njit
import numpy as np
import math

#flip the filter  in the convolution step
#from .helpers.input_checks  import check1
from .helpers.input_checks  import check_grid_params
from .helpers.input_checks  import check_cpp_params
from .helpers.input_checks  import check_trawl_function
from .helpers.input_checks  import check_jump_part_and_params
from .helpers.input_checks  import check_gaussian_params

 
from .helpers.sampler                            import gaussian_part_sampler 
from .helpers.sampler                            import jump_part_sampler
from .helpers.sampler                            import generate_cpp_points
from .helpers.acf_functions                      import fit_trawl_envelope_gmm
from .helpers.marginal_distribution_functions    import fit_trawl_marginal
#from .heleprs.sampler     import generate_cpp_values_associated_to_points

from .helpers.alternative_convolution_implementation import cumulative_and_diagonal_sums

from .helpers.forecasting_helpers import deterministic_forecasting
from .helpers.forecasting_helpers import probabilistic_forecasting


#from scipy.optimize import minimize
#from statsmodels.tsa.stattools import acf
#helper_module = import_file(os.path.join(Path().resolve().parent,'helpers','loss_functions'))
###################################################

class trawl:
    def __init__(self,nr_simulations,nr_trawls = None, trawl_function=None, tau = None, 
                decorrelation_time = -np.inf, mesh_size = None, times_grid = None, 
                truncation_grid = None, gaussian_part_params= (0,0), jump_part_name=None,
                jump_part_params= None, cpp_times = None, cpp_truncation = None, cpp_part_name = None, cpp_part_params = None,
                cpp_intensity = None, custom_sampler = None, values=None):
        """Please consult the `Trawl processes example usage` jupyter notebook from https://github.com/danleonte/Ambit_Stochastics
        to see a practical example with detailed explanations.
        
        The implemented simulation algorithms are the grid, slice and cpp algorithms, as described in [paper link]. Parameter inference and forecasting methods to be added.

        The arguments required for the `simulate` method are `nr_simulations` and `trawl_function`.
        Further, the slice method requires `nr_trawls`,
        `tau`, `decorrelation_time`, `gaussian_part_params`, `jump_part_name`,`jump_part_params`,
         the grid method requires
        `mesh_size`,`times_grid`,`truncation_grid`, `gaussian_part_params`,`jump_part_name`,`jump_part_params` and
         the cpp method requires `cpp_truncation,`,`cpp_part_name`, `cpp_times`
        `cpp_part_params`, `cpp_intensity` and `custom_sampler`.
               
        Args:
          The following parameters are for any of simulation algorithms.
          
          nr_simulations: positive integer: number of simulations of the trawl process.
          trawl_function: a non-negative, continuous, strictly increasing function \(\phi \colon (-\infty,0] \\to [0,\infty)\) with \(\phi(0) >0, \phi(t) =0\) for \(t>0\).

          The following parameters are for both the slice and grid simulation methods.
          
          gaussian_part_params: tuple with the mean and standard deviation of the Gaussian Part
          jump_part_name: tuple with the parameters of the jump part distribution check `helpers.sampler` for the parametrisation.
          jump_part_params: string: name of the jump part distribution. check `helpers.sampler` for the parametrisation.

          The following parameters are for the slice simulation method.
          
          nr_trawls: positive integer: number of ambit sets on the time axis.
          tau: positive number: spacing between ambit sets on the time axis; the times at which we simulate the trawl processes are then \(\\tau, \\ldots,\\text{nr_trawls} \ \\tau\).
          decorrelation_time: \(-\infty\) if the ambit set A is unbounded and finite, negative otherwise. For example, if \(\phi(x) = (1+x)(x>-1)(x<=0)\), `decorrelation_time =-1`.
      
          The following parameters are for the grid simulation method.

          mesh_size: positive float, side-length of each cell.
          times_grid: array: times at which to simulate the trawl process, necessarly in increasing order.
          truncation_grid: strictly negative float: in the grid simulation method, we simulate the parts of the ambit sets contained in \(t > \\text{truncation_grid} + \\text{min(times_grid)}\).

          The following parameters are for both the cpp simulation methods.

          cpp_times: array: times at which to simulate the trawl process.
          cpp_truncation: strictly negative float: we simulate the parts of the ambit sets contained in \(t > \\text{cpp_truncation} + \\text{min(cpp_times)}\).
          cpp_part_name: to add
          cpp_part_params: to add
          cpp_intensity: to add
          custom_sampler: to add
              
          values: a numpy array with shape \([\\text{nr_simulations},k_s,k_t]\) which is passed by the user or simulated with the method `simple_ambit_field.simulate`.
         """
       
        #general attributes
        self.nr_simulations  = nr_simulations
        #attributes required for simulation
        self.trawl_function                 = trawl_function
        
        #########################################################################
        ### attributes required for both grid and slice simulation algorithms ###
        
        # distributional parameters of the gaussian and jump parts of the levy seed 
        # jump_part_name and jump_part_params are also requried for the grid method
        
        self.gaussian_part_params           = gaussian_part_params
        self.jump_part_name                 = jump_part_name
        self.jump_part_params               = jump_part_params

        
        #############################################################################     
        ### attributes required only for the slice partition simulation algorithm ###  
   
        self.nr_trawls                      = nr_trawls
        self.tau                            = tau
        self.decorrelation_time             = decorrelation_time
        self.I                              = None
        self.slice_areas_matrix             = None

        
        ################################################################## 
        ### attributes required only for the grid simulation algorithm ###
        
        self.times_grid               = times_grid
        self.truncation_grid          = truncation_grid       
        self.mesh_size                = mesh_size
        self.times_grid               = times_grid
        self.vol                      = None
        
        #self.indicator_matrix               = None
        
        ################################################################## 
        ### attributes required only for the cpp simulation algorithm  ###
        
        self.cpp_truncation  = cpp_truncation
        self.cpp_part_name   = cpp_part_name 
        self.cpp_part_params = cpp_part_params
        self.cpp_intensity   = cpp_intensity
        self.custom_sampler  = custom_sampler
        self.cpp_times       = cpp_times
            
        ### arrays containing the gaussian, jump and cpp parts of the simulation
        self.gaussian_values          =   None 
        self.jump_values              =   None 
        self.cpp_values               =   None 
        
        ### passed by the user or to be simulated using one of the simulation methods ### 
        self.values                   =   values 
        
        #if the values are passed by the use and not simulated
        if values is not None:
            self.nr_simulations, self.nr_tralws = self.values.shape
            
             
        #############################################################################     
        ### attributes required only for the parameter inference ###  
        self.infered_parameters   = None
        # {'envelope': exponential, 'levy_seed': 'gamma', 'params' : 
        #    {'envelope_params': tuple of tuples , 'levy_seed_params': tuple of tuples}}
        
    ######################################################################
    ###  Simulation algorithms:      I slice, II grid, III cpp         ###
    ######################################################################
    
    
       ########################### I Slice ###########################

    
    def compute_slice_areas_finite_decorrelation_time(self):
        """Computes the \(I \\times k\) matrix 
        
        \[\\begin{bmatrix}
              a_0     &  a_0 - a_1          \\ldots  & a_0 - a_1          \\\\
              a_1     &  a_1 - a_2          \\ldots  & a_1 - a_2          \\\\
              a_2     &  a_2 - a_3          \\ldots  & a_2 - a_3          \\\\
                      &                     \\vdots  &                    \\\\
              a_{k-2} & a_{k-2} - a_{k-1}   \\ldots  & a_{k-2} - a_{k-1}  \\\\
              a_{k-1} & a_{k-1}                      & a_{k-1}            
        \\end{bmatrix}\]
        
        corresponding to the areas of the slices 
        
                
        \[\\begin{bmatrix}
        L(S_{11})  & \\ldots & L(S_{1,k-1}) & L(S_{1k}) \\\\
        L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & L(S_{2k}) \\\\
         \\vdots &       &  \\vdots  & \\vdots  \\\\
        L(S_{I1}) &  \\ldots &  L(S_{I,k-1}) & L(S_{I,k})
        \\end{bmatrix}
        \]
            
        where \(k =\) `self.nr_trawls` and 
        
        \[\\begin{align}
        a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
            \\vdots & \\\\
        a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
        a_{k-1} &= \int_{\\text{decorrelation_time}}^{(-k+1)\\tau} \phi(u)du.
        \\end{align} 
        \]            
            """
        self.I = math.ceil(-self.decorrelation_time/self.tau)
        
        s_i1 = [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
                for i in range(1,self.I+1)]
        s_i2 = np.append(np.diff(s_i1[::-1])[::-1],s_i1[-1])
        
        right_column = np.tile(s_i2[:,np.newaxis],(1,self.nr_trawls-1))
        left_column  = left_column  = (np.array(s_i1))[:,np.newaxis]
        self.slice_areas_matrix  = np.concatenate([left_column,right_column],axis=1)
        
        #to add I-1 columns of length I zeros
        #check entire program here and comapre with previous versions
                
    
    def compute_slice_areas_infinite_decorrelation_time(self):
        """Computes the  \(k \\times k\) matrix  
        
        \[\\begin{bmatrix}
              a_0     &  a_0 - a_1  & a_0 - a_1  &    \\ldots  & a_0 - a_1  & a_0 - a_1  & a_0 \\\\
              a_1     &  a_1 - a_2  & a_1 - a_2  &    \\ldots  & a_1 - a_2  & a_1        & 0   \\\\
              a_2     &  a_2 - a_3  & a_2 - a_3  &    \\ldots  & a_2        & 0          & 0   \\\\
                      &             &            &    \\vdots  &            &            &     \\\\
              a_{k-2} & a_{k-1}     & 0          &    \\ldots  &  0         & 0          & 0   \\\\
              a_{k-1} & 0           & 0          &             &  0         & 0          & 0
        \\end{bmatrix}\]
            
        corresponding to the areas of the slices 
        
                
        \[\\begin{bmatrix}
        L(S_{11})  & \\ldots & L(S_{1k,-1}) & L(S_{1k}) \\\\
        L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & 0 \\\\
         \\vdots &       &  \\vdots  & \\vdots  \\\\
        L(S_{k1}) &  \\ldots &  0 & 0
        \\end{bmatrix}
        \]
         
        
        where \(k =\) `self.nr_trawls` and 
        
        \[\\begin{align}
        a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
            \\vdots & \\\\
        a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
        a_{k-1} &= \int_{-\infty}^{(-k+1)\\tau} \phi(u)du.
        \\end{align} 
        \]
        """
        s_i1 =  [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
                 for i in range(1,self.nr_trawls)] + [quad(self.trawl_function,a=-np.inf,
                                                           b=(-self.nr_trawls+1)*self.tau)[0]]
        
                                                           
        #  a[0] -a[1] ,a[1] -a[2], ... , a[k-2] - a[k-1] , 0
        differences   = np.append(np.diff(s_i1[::-1])[::-1],0) 

        left_column  = np.array(s_i1)[:,np.newaxis]  
        right_column = np.zeros((self.nr_trawls,1))
        #we reconstruct the elements on the secondary diagonal at the end
        
                                                     
        middle_matrix = np.tile(differences[:,np.newaxis],(1,self.nr_trawls-2))
        whole_matrix  = np.concatenate([left_column,middle_matrix,right_column],axis=1)
        whole_matrix_reversed   = np.triu(np.fliplr(whole_matrix), k=0)
        np.fill_diagonal(whole_matrix_reversed,s_i1)     

        self.slice_areas_matrix = np.fliplr(whole_matrix_reversed)
    
    def simulate_slice_finite_decorrelation_time(self,slice_convolution_type):
        """helper for the `simulate_slice` method"""
        
        filter_ = np.fliplr(np.tril(np.ones(self.I),k=0)) 
        zero_matrix  = np.zeros([self.I,self.I-1])

        for simulation_nr in range(self.nr_simulations):
            gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
            jump_slices     = jump_part_sampler(self.jump_part_params,self.slice_areas_matrix,self.jump_part_name)
            
            if slice_convolution_type == 'fft':
        
                gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
                jump_slices = np.concatenate([zero_matrix,jump_slices],axis=1)
        
                #matrix with 1's on and below the secondary diagonal
                #flip the filter to agree with np convention
                self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
                self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
        
            elif slice_convolution_type == 'diagonals':
                
                self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
                self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)
                
                
    def simulate_slice_infinite_decorrelation_time(self,slice_convolution_type):
        """Helper for the `simulate_slice` method."""

        zero_matrix     = np.zeros([self.nr_trawls,self.nr_trawls-1])
        filter_         = np.fliplr(np.tril(np.ones(self.nr_trawls),k=0)) 


        for simulation_nr in range(self.nr_simulations):
            
            gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
            
            #the lower triangular part of the matrix is made oup of 0's, which can result in an error
            #in the scipy.stats sampler (for example, if the levy seed is gamma)
            #to prevent this, we extract the upper triangular part of the matrix as a vector
            #sample this way, then recast the samples as an upper triangular matrix
            slice_areas_row   = (np.fliplr(self.slice_areas_matrix))[np.triu_indices(self.slice_areas_matrix.shape[0], k = 0)]
            jump_slices_row   = jump_part_sampler(self.jump_part_params,slice_areas_row,self.jump_part_name)
            jump_slices       = np.zeros(gaussian_slices.shape)
            jump_slices[np.triu_indices(jump_slices.shape[0], k = 0)]     = jump_slices_row
            jump_slices       = np.fliplr(jump_slices)
             

            if slice_convolution_type == 'fft':
                gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
                jump_slices     = np.concatenate([zero_matrix,jump_slices],axis=1)
                
                self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
                self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
                
            elif slice_convolution_type == 'diagonals':
                
                self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
                self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)
        
        
    def simulate_slice(self,slice_convolution_type):
        """implements algorithm [] from [] and simulates teh trawl process at 
        \(\\tau,\\ldots,\\text{nr_trawls}\ \\tau\). `slice_convolution_type` can be either [to add]"""
        if self.decorrelation_time == -np.inf:
            self.compute_slice_areas_infinite_decorrelation_time()
            self.simulate_slice_infinite_decorrelation_time(slice_convolution_type)
             
        elif self.decorrelation_time > -np.inf:
            assert(self.trawl_function(self.decorrelation_time)) == 0,'please check decorrelation time' 
            self.compute_slice_areas_finite_decorrelation_time()
            self.simulate_slice_finite_decorrelation_time(slice_convolution_type)
        #self.values = self.gaussian_values + self.jump_values

                      
       ############################ II Grid ############################
    
    def grid_creation(self,min_t,max_t):
        """Creates a grid on \([0,\phi(0)] \\times [\\text{min_t}, \\text{max_t}]\). Each cell is represented by 
        the coordinates of its bottom left corner. To each cell we associate a sample from each of the gaussian
        and jump parts of the trawl process.
        
        Returns:
          gaussian_values:  array with the Gaussian of the Levy basis evaluated over the cells  
          jump_values: array with the jump part of the Levy basis evaluated over the cells      
        """
            
        coords = np.mgrid[0:self.trawl_function(0):self.mesh_size,min_t:max_t:self.mesh_size]
        x, t   = coords[0].flatten(), coords[1].flatten() 
        
        areas            = self.vol * np.ones([self.nr_simulations,len(t)])
        gaussian_values  = gaussian_part_sampler(self.gaussian_part_params,areas)
        jump_values      = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)
        
            
        return x,t,gaussian_values,jump_values
    
    def grid_update(self,i,t,gaussian_values,jump_values):
        """Inputs the values of the Levy basis evaluated over the grid cells on \([\\tau_{i-1}+\\text{truncation_grid},\\tau_{i-1}] \\times [0,\\phi(0)]\),
        removes the values corresponding to cells with time coordinates less than \(\\tau_{i} + \\text{truncation_grid}\) and adds new samples
        for the levy basis evaluated over the grid cells with time coordinates in \([\\tau_{i-1},\\tau_i]\) (see figure). 
        Assumes that the consecutive ambit sets at times \(\\tau_{i-1},\\tau_i\) are not disjoint, i.e.
        \(\\tau_i + \\text{truncation_grid} < \\tau_{i-1}\).
        
        Args:
          i: index of the trawl to be simulated
          t: time coordinates of the cells of the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          gaussian_values: gaussian values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          jump_values: jump values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)\)
        
        Returns:
          gaussian_values: gaussian values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          jump_values: jump values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)                                                                                                                                                                                                
         """
          

        ind_to_keep       =  t >= (self.times_grid[i] + self.truncation_grid)
        t[~ind_to_keep]  += -self.truncation_grid
        
        areas             = self.vol * np.ones([self.nr_simulations,sum(~ind_to_keep)])
        #print(gaussian_values[:,~ind_to_keep].shape)
        #print(self.gaussian_part_sampler(areas).shape)
        gaussian_values[:,~ind_to_keep] = gaussian_part_sampler(self.gaussian_part_params,areas)
        jump_values[:,~ind_to_keep]     = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)  
        #print('ind to keep sum is ', ind_to_keep.sum())
        #print('gaussian is ',gaussian_values.shape)
        #print('non_gaussian_values ',non_gaussian_values[:,ind_to_keep].shape)
        #print('new_gaussian_values ',new_gaussian_values.shape)
        #print('t new shape is ',t.shape)
        #print('x shape is', x.shape)
        
        return t,gaussian_values,jump_values   
    
    
    def simulate_grid(self):
        """Simulate the trawl proces at times `self.times_grid`, which don't have to be
        equally distant, via the grid method."""
        
        #If `times_grid` are equidistnant, we do not need to compute `indicators` at each iteration, speeding up the process        

        for i in range(len(self.times_grid)):
             if (i==0) or (self.times_grid[i-1] <= self.times_grid[i] + self.truncation_grid):
                 #check that we are creating the grid for the first time or that 
                 #trawls at time i-1 and i have empty intersection
                 x,t,gaussian_values, jump_values = self.grid_creation(self.times_grid[i] + self.truncation_grid, self.times_grid[i])

                
             elif self.times_grid[i-1] > self.times_grid[i] + self.truncation_grid:
                 #check that we have non empty intersection and update the grid
                 t,gaussian_values,jump_values = self.grid_update(i,t,gaussian_values,jump_values)
            
             indicators = x < self.trawl_function(t-self.times_grid[i])
             #print(gaussian_values.shape,indicators.shape)
             self.gaussian_values[:,i]  = gaussian_values @ indicators
             self.jump_values[:,i]      = jump_values @ indicators
             
        #self.values = self.gaussian_values + self.jump_values
       ########################### III cpp ###########################
#    @njit   
    def simulate_cpp(self):
        """ text to be added"""
        min_t = min(self.cpp_times) + self.cpp_truncation
        max_t = max(self.cpp_times)
        min_x = 0
        max_x = self.trawl_function(0)
        
        for simulation_nr in range(self.nr_simulations):
            
        
            points_x, points_t, associated_values = generate_cpp_points(min_x = min_x, max_x = max_x, 
                        min_t = min_t, max_t = max_t, cpp_part_name = self.cpp_part_name,
                        cpp_part_params = self.cpp_part_params, cpp_intensity = self.cpp_intensity,
                        custom_sampler = self.custom_sampler)
                                    
            #(x_i,t_i) in A_t if t < t_i and x_i < phi(t_i-t)
            indicator_matrix = np.tile(points_x[:,np.newaxis],(1,self.nr_trawls)) < \
                            self.trawl_function(np.subtract.outer(points_t, self.cpp_times))
            self.cpp_values[simulation_nr,:] = associated_values @ indicator_matrix
                            
        
       ####################### simulate meta-method #######################
    def simulate(self,method,slice_convolution_type='diagonals'):
         """Function to simulate from the trawl function. Contains sanity checks
         for the simulation parameters and uses helper functions for each simulation
         method.
         
         Args:
           method: one of the strings `cpp`, `grid` or `slice`
           slice_convolution_type: if method is set to `slice`, this can be one of the strings `diagonals` or `ftt`, depending on the way we add up the simulated slices. This argument is ignored if method is set to `grid` or `cpp`."""

         #general checks
         assert isinstance(self.nr_simulations,int) and self.nr_simulations >0
         assert method in {'cpp','grid','slice'},'simulation method not supported'
         check_trawl_function(self.trawl_function)
         check_gaussian_params(self.gaussian_part_params)
         
         
         #algorithm specific checks and attribute setting
         if method == 'grid':
             check_jump_part_and_params(self.jump_part_name,self.jump_part_params)
             check_grid_params(self.mesh_size,self.truncation_grid,self.times_grid)
             
             self.nr_trawls = len(self.times_grid)
             self.vol = self.mesh_size **2
             
         elif method == 'cpp':
             check_cpp_params(self.cpp_part_name, self.cpp_part_params,self.cpp_intensity,self.custom_sampler)

             self.nr_trawls = len(self.cpp_times)
                 
         elif method == 'slice':
             assert slice_convolution_type in {'fft','diagonals'}
             assert isinstance(self.nr_trawls,int) and self.nr_trawls > 0,'nr_trawls should be a  strictly positive integer'
             check_jump_part_and_params(self.jump_part_name,self.jump_part_params)

             
         self.gaussian_values          =   np.zeros(shape = [self.nr_simulations,self.nr_trawls]) 
         self.jump_values              =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
         self.cpp_values               =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
        
        
         if method == 'grid':
             self.simulate_grid()
         elif method == 'cpp':
             self.simulate_cpp()
         elif method == 'slice':
             self.simulate_slice(slice_convolution_type)    

         self.values = self.gaussian_values + self.jump_values + self.cpp_values
         
             
    def theoretical_acf(self,t_values):
        """Computes the theoretical acf of the trawl process
        
        Args:
          t_values: array of time values 
        
        Returns:
          d_acf: a dictionary of the type  \(t: \\text{corr}(X_0,X_t)\), where \(t\) ranges over the input array `t_values`. 
        """
        total_area = quad(self.trawl_function,a=-np.inf,b= 0)[0]
        d_acf=dict()
        for t in t_values:
            d_acf[t] = quad(self.trawl_function,a=-np.inf,b= -t)[0]/total_area
        return d_acf
                  

             
    ######################################################################
    ###  Forecasting:      determinstic and probabilistic              ###
    ######################################################################
    
    
    def fit_gmm(self,input_values,envelope,levy_seed,lags,initial_guess=None):

        
        assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
        
        print('gmm fit started')
        
        envelope_params  = fit_trawl_envelope_gmm(self.tau,input_values,lags,envelope,initial_guess)
        levy_seed_params = fit_trawl_marginal(input_values,levy_seed)
        params =  {'envelope_params':envelope_params,'levy_seed_params': levy_seed_params}
        self.infered_parameters =  {'envelope': envelope, 'levy_seed': levy_seed, 'params' : params}
        
        print('gmm fit finished')
    
    def fit_cl(self,input_values, envelope, levy_seed, lags,  cl_optimisation_params = 
               {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
               initial_guess = None):
        
        assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
        print('cl fit started')
        print('cl fit finished')

        pass
    
    
    def predict(self,input_values, steps_ahead, deterministic, max_gaussian_lag = 1.0, nr_samples = None):
        
        #input_values = self.values[:,starting_index:]
        assert isinstance(input_values,np.ndarray) and len(input_values.shape) == 2
        assert deterministic  in [True,False]
        
        ##get the fitted parameters for teh envelope and for the levy seed from the attribute self.infered_parameters

        envelope         = self.infered_parameters['envelope']
        levy_seed        = self.infered_parameters['levy_seed']
        envelope_params  = self.infered_parameters['params']['envelope_params']
        levy_seed_params = self.infered_parameters['params']['levy_seed_params']
        nr_simulations, simulation_length = input_values.shape                                       
        d={}
        
        if levy_seed == 'gaussian':
            assert isinstance(max_gaussian_lag,int) and max_gaussian_lag > 0 and input_values.shape[-1] >= max_gaussian_lag
        
        for nr_steps_ahead in steps_ahead:
            
          if deterministic == True:
              
              array_to_add = np.zeros([nr_simulations,simulation_length - int((max_gaussian_lag - 1)) * (levy_seed == 'gaussian')])
              
          elif deterministic == False:
              
              array_to_add = np.zeros([nr_simulations, simulation_length - int((max_gaussian_lag - 1)) *(levy_seed == 'gaussian'),
                                       nr_samples])

          for i in range(nr_simulations):
              #to deal with gaussian lag helper
              
              if deterministic == True: 
                  array_to_add[i] = deterministic_forecasting(tau = self.tau, nr_steps_ahead =  nr_steps_ahead ,
                                    values = input_values[i], levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                    envelope = envelope, envelope_params = envelope_params[i], 
                                    envelope_function = None, max_gaussian_lag = max_gaussian_lag)
                        
              elif deterministic == False:
                  print(i)

                  array_to_add[i] = probabilistic_forecasting(tau = self.tau, nr_steps_ahead = nr_steps_ahead, values = input_values[i],
                                    levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                    envelope = envelope, envelope_params = envelope_params[i], nr_samples =  nr_samples,
                                    envelope_function = None, max_gaussian_lag = max_gaussian_lag)
          
          d[nr_steps_ahead] =  array_to_add       
                  
        return d
                    
                    
            
            #if type_ == 'deterministic':
            #    deterministic_forecasting(tau_ahead,values,levy_seed,levy_seed_params,envelope,
             #                                     envelope_params, nr_samples, envelope_function = None)
            
            #elif type__ == 'probabilistic':
            #    pass
    
    def fit_predict(self,steps_ahead,deterministic,fitting_method,envelope,levy_seed,lags,
                    initial_training_window,refit,refit_freq=None,initial_guess = None, 
                    cl_optimisation_params =  
                    {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                    max_gaussian_lag = None, nr_samples=None):
        
        #check inputs 
        assert all(isinstance(x, int) and x >0 for x in steps_ahead)
        assert deterministic in [True,False]
        assert fitting_method in ['gmm','cl']
        assert refit in [True,False]  
        if refit == True:
            assert refit_freq >0 and isinstance(refit_freq,int)
            
        assert isinstance(lags,tuple)  and all(isinstance(i,int) for i in lags)
        assert isinstance(initial_training_window,int) and  initial_training_window > 0 
        if fitting_method == 'cl':
            assert set(self.infered_parameters.keys()) == {'nr_mc_samples', 'nr_repetitions', 'nr_steps_optimisation'}
            assert all((isinstance(x,int) and x > 0)  for x in self.intered_parameters.values())
        if deterministic == False:
            assert isinstance(nr_samples,int) and nr_samples > 0

            
        if fitting_method == 'gmm':
            self.fit_gmm(input_values = self.values[:,:initial_training_window],envelope = envelope,
                         levy_seed = levy_seed, lags = lags, initial_guess = initial_guess)
            
        elif fitting_method == 'cl':
            self.fit_cl(input_values = self.values[:,:initial_training_window],
                        envelope = envelope, levy_seed = levy_seed, lags = lags,cl_optimisation_params = 
                        {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                        initial_guess = None)
                
        if refit == False:   
            
            return self.predict(input_values = self.values[:,:initial_training_window], steps_ahead = steps_ahead,
                             deterministic = deterministic, max_gaussian_lag = max_gaussian_lag,
                             nr_samples = nr_samples)
            
        elif refit == True:
            
            raise ValueError('not yet implemented')

Classes

class trawl (nr_simulations, nr_trawls=None, trawl_function=None, tau=None, decorrelation_time=-inf, mesh_size=None, times_grid=None, truncation_grid=None, gaussian_part_params=(0, 0), jump_part_name=None, jump_part_params=None, cpp_times=None, cpp_truncation=None, cpp_part_name=None, cpp_part_params=None, cpp_intensity=None, custom_sampler=None, values=None)

Please consult the Trawl processes example usage jupyter notebook from https://github.com/danleonte/Ambit_Stochastics to see a practical example with detailed explanations.

The implemented simulation algorithms are the grid, slice and cpp algorithms, as described in [paper link]. Parameter inference and forecasting methods to be added.

The arguments required for the simulate method are nr_simulations and trawl_function. Further, the slice method requires nr_trawls, tau, decorrelation_time, gaussian_part_params, jump_part_name,jump_part_params, the grid method requires mesh_size,times_grid,truncation_grid, gaussian_part_params,jump_part_name,jump_part_params and the cpp method requires cpp_truncation,,cpp_part_name, cpp_times cpp_part_params, cpp_intensity and custom_sampler.

Args

The following parameters are for any of simulation algorithms.

nr_simulations: positive integer: number of simulations of the trawl process.
trawl_function: a non-negative, continuous, strictly increasing function $\phi \colon (-\infty,0] \to [0,\infty)$ with $\phi(0) >0, \phi(t) =0$ for $t>0$ .

The following parameters are for both the slice and grid simulation methods.

gaussian_part_params: tuple with the mean and standard deviation of the Gaussian Part
jump_part_name: tuple with the parameters of the jump part distribution check helpers.sampler for the parametrisation.
jump_part_params: string: name of the jump part distribution. check helpers.sampler for the parametrisation.

The following parameters are for the slice simulation method.

nr_trawls: positive integer: number of ambit sets on the time axis.
tau: positive number: spacing between ambit sets on the time axis; the times at which we simulate the trawl processes are then $\tau, \ldots,\text{nr_trawls} \ \tau$ .
decorrelation_time: $-\infty$ if the ambit set A is unbounded and finite, negative otherwise. For example, if $\phi(x) = (1+x)(x>-1)(x<=0)$ , decorrelation_time =-1.

The following parameters are for the grid simulation method.

mesh_size: positive float, side-length of each cell.
times_grid: array: times at which to simulate the trawl process, necessarly in increasing order.
truncation_grid: strictly negative float: in the grid simulation method, we simulate the parts of the ambit sets contained in $t > \text{truncation_grid} + \text{min(times_grid)}$ .

The following parameters are for both the cpp simulation methods.

cpp_times: array: times at which to simulate the trawl process.
cpp_truncation: strictly negative float: we simulate the parts of the ambit sets contained in $t > \text{cpp_truncation} + \text{min(cpp_times)}$ .
cpp_part_name: to add
cpp_part_params: to add
cpp_intensity: to add
custom_sampler: to add
values: a numpy array with shape $[\text{nr_simulations},k_s,k_t]$ which is passed by the user or simulated with the method simple_ambit_field.simulate.

Expand source code

class trawl:
    def __init__(self,nr_simulations,nr_trawls = None, trawl_function=None, tau = None, 
                decorrelation_time = -np.inf, mesh_size = None, times_grid = None, 
                truncation_grid = None, gaussian_part_params= (0,0), jump_part_name=None,
                jump_part_params= None, cpp_times = None, cpp_truncation = None, cpp_part_name = None, cpp_part_params = None,
                cpp_intensity = None, custom_sampler = None, values=None):
        """Please consult the `Trawl processes example usage` jupyter notebook from https://github.com/danleonte/Ambit_Stochastics
        to see a practical example with detailed explanations.
        
        The implemented simulation algorithms are the grid, slice and cpp algorithms, as described in [paper link]. Parameter inference and forecasting methods to be added.

        The arguments required for the `simulate` method are `nr_simulations` and `trawl_function`.
        Further, the slice method requires `nr_trawls`,
        `tau`, `decorrelation_time`, `gaussian_part_params`, `jump_part_name`,`jump_part_params`,
         the grid method requires
        `mesh_size`,`times_grid`,`truncation_grid`, `gaussian_part_params`,`jump_part_name`,`jump_part_params` and
         the cpp method requires `cpp_truncation,`,`cpp_part_name`, `cpp_times`
        `cpp_part_params`, `cpp_intensity` and `custom_sampler`.
               
        Args:
          The following parameters are for any of simulation algorithms.
          
          nr_simulations: positive integer: number of simulations of the trawl process.
          trawl_function: a non-negative, continuous, strictly increasing function \(\phi \colon (-\infty,0] \\to [0,\infty)\) with \(\phi(0) >0, \phi(t) =0\) for \(t>0\).

          The following parameters are for both the slice and grid simulation methods.
          
          gaussian_part_params: tuple with the mean and standard deviation of the Gaussian Part
          jump_part_name: tuple with the parameters of the jump part distribution check `helpers.sampler` for the parametrisation.
          jump_part_params: string: name of the jump part distribution. check `helpers.sampler` for the parametrisation.

          The following parameters are for the slice simulation method.
          
          nr_trawls: positive integer: number of ambit sets on the time axis.
          tau: positive number: spacing between ambit sets on the time axis; the times at which we simulate the trawl processes are then \(\\tau, \\ldots,\\text{nr_trawls} \ \\tau\).
          decorrelation_time: \(-\infty\) if the ambit set A is unbounded and finite, negative otherwise. For example, if \(\phi(x) = (1+x)(x>-1)(x<=0)\), `decorrelation_time =-1`.
      
          The following parameters are for the grid simulation method.

          mesh_size: positive float, side-length of each cell.
          times_grid: array: times at which to simulate the trawl process, necessarly in increasing order.
          truncation_grid: strictly negative float: in the grid simulation method, we simulate the parts of the ambit sets contained in \(t > \\text{truncation_grid} + \\text{min(times_grid)}\).

          The following parameters are for both the cpp simulation methods.

          cpp_times: array: times at which to simulate the trawl process.
          cpp_truncation: strictly negative float: we simulate the parts of the ambit sets contained in \(t > \\text{cpp_truncation} + \\text{min(cpp_times)}\).
          cpp_part_name: to add
          cpp_part_params: to add
          cpp_intensity: to add
          custom_sampler: to add
              
          values: a numpy array with shape \([\\text{nr_simulations},k_s,k_t]\) which is passed by the user or simulated with the method `simple_ambit_field.simulate`.
         """
       
        #general attributes
        self.nr_simulations  = nr_simulations
        #attributes required for simulation
        self.trawl_function                 = trawl_function
        
        #########################################################################
        ### attributes required for both grid and slice simulation algorithms ###
        
        # distributional parameters of the gaussian and jump parts of the levy seed 
        # jump_part_name and jump_part_params are also requried for the grid method
        
        self.gaussian_part_params           = gaussian_part_params
        self.jump_part_name                 = jump_part_name
        self.jump_part_params               = jump_part_params

        
        #############################################################################     
        ### attributes required only for the slice partition simulation algorithm ###  
   
        self.nr_trawls                      = nr_trawls
        self.tau                            = tau
        self.decorrelation_time             = decorrelation_time
        self.I                              = None
        self.slice_areas_matrix             = None

        
        ################################################################## 
        ### attributes required only for the grid simulation algorithm ###
        
        self.times_grid               = times_grid
        self.truncation_grid          = truncation_grid       
        self.mesh_size                = mesh_size
        self.times_grid               = times_grid
        self.vol                      = None
        
        #self.indicator_matrix               = None
        
        ################################################################## 
        ### attributes required only for the cpp simulation algorithm  ###
        
        self.cpp_truncation  = cpp_truncation
        self.cpp_part_name   = cpp_part_name 
        self.cpp_part_params = cpp_part_params
        self.cpp_intensity   = cpp_intensity
        self.custom_sampler  = custom_sampler
        self.cpp_times       = cpp_times
            
        ### arrays containing the gaussian, jump and cpp parts of the simulation
        self.gaussian_values          =   None 
        self.jump_values              =   None 
        self.cpp_values               =   None 
        
        ### passed by the user or to be simulated using one of the simulation methods ### 
        self.values                   =   values 
        
        #if the values are passed by the use and not simulated
        if values is not None:
            self.nr_simulations, self.nr_tralws = self.values.shape
            
             
        #############################################################################     
        ### attributes required only for the parameter inference ###  
        self.infered_parameters   = None
        # {'envelope': exponential, 'levy_seed': 'gamma', 'params' : 
        #    {'envelope_params': tuple of tuples , 'levy_seed_params': tuple of tuples}}
        
    ######################################################################
    ###  Simulation algorithms:      I slice, II grid, III cpp         ###
    ######################################################################
    
    
       ########################### I Slice ###########################

    
    def compute_slice_areas_finite_decorrelation_time(self):
        """Computes the \(I \\times k\) matrix 
        
        \[\\begin{bmatrix}
              a_0     &  a_0 - a_1          \\ldots  & a_0 - a_1          \\\\
              a_1     &  a_1 - a_2          \\ldots  & a_1 - a_2          \\\\
              a_2     &  a_2 - a_3          \\ldots  & a_2 - a_3          \\\\
                      &                     \\vdots  &                    \\\\
              a_{k-2} & a_{k-2} - a_{k-1}   \\ldots  & a_{k-2} - a_{k-1}  \\\\
              a_{k-1} & a_{k-1}                      & a_{k-1}            
        \\end{bmatrix}\]
        
        corresponding to the areas of the slices 
        
                
        \[\\begin{bmatrix}
        L(S_{11})  & \\ldots & L(S_{1,k-1}) & L(S_{1k}) \\\\
        L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & L(S_{2k}) \\\\
         \\vdots &       &  \\vdots  & \\vdots  \\\\
        L(S_{I1}) &  \\ldots &  L(S_{I,k-1}) & L(S_{I,k})
        \\end{bmatrix}
        \]
            
        where \(k =\) `self.nr_trawls` and 
        
        \[\\begin{align}
        a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
            \\vdots & \\\\
        a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
        a_{k-1} &= \int_{\\text{decorrelation_time}}^{(-k+1)\\tau} \phi(u)du.
        \\end{align} 
        \]            
            """
        self.I = math.ceil(-self.decorrelation_time/self.tau)
        
        s_i1 = [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
                for i in range(1,self.I+1)]
        s_i2 = np.append(np.diff(s_i1[::-1])[::-1],s_i1[-1])
        
        right_column = np.tile(s_i2[:,np.newaxis],(1,self.nr_trawls-1))
        left_column  = left_column  = (np.array(s_i1))[:,np.newaxis]
        self.slice_areas_matrix  = np.concatenate([left_column,right_column],axis=1)
        
        #to add I-1 columns of length I zeros
        #check entire program here and comapre with previous versions
                
    
    def compute_slice_areas_infinite_decorrelation_time(self):
        """Computes the  \(k \\times k\) matrix  
        
        \[\\begin{bmatrix}
              a_0     &  a_0 - a_1  & a_0 - a_1  &    \\ldots  & a_0 - a_1  & a_0 - a_1  & a_0 \\\\
              a_1     &  a_1 - a_2  & a_1 - a_2  &    \\ldots  & a_1 - a_2  & a_1        & 0   \\\\
              a_2     &  a_2 - a_3  & a_2 - a_3  &    \\ldots  & a_2        & 0          & 0   \\\\
                      &             &            &    \\vdots  &            &            &     \\\\
              a_{k-2} & a_{k-1}     & 0          &    \\ldots  &  0         & 0          & 0   \\\\
              a_{k-1} & 0           & 0          &             &  0         & 0          & 0
        \\end{bmatrix}\]
            
        corresponding to the areas of the slices 
        
                
        \[\\begin{bmatrix}
        L(S_{11})  & \\ldots & L(S_{1k,-1}) & L(S_{1k}) \\\\
        L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & 0 \\\\
         \\vdots &       &  \\vdots  & \\vdots  \\\\
        L(S_{k1}) &  \\ldots &  0 & 0
        \\end{bmatrix}
        \]
         
        
        where \(k =\) `self.nr_trawls` and 
        
        \[\\begin{align}
        a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
            \\vdots & \\\\
        a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
        a_{k-1} &= \int_{-\infty}^{(-k+1)\\tau} \phi(u)du.
        \\end{align} 
        \]
        """
        s_i1 =  [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
                 for i in range(1,self.nr_trawls)] + [quad(self.trawl_function,a=-np.inf,
                                                           b=(-self.nr_trawls+1)*self.tau)[0]]
        
                                                           
        #  a[0] -a[1] ,a[1] -a[2], ... , a[k-2] - a[k-1] , 0
        differences   = np.append(np.diff(s_i1[::-1])[::-1],0) 

        left_column  = np.array(s_i1)[:,np.newaxis]  
        right_column = np.zeros((self.nr_trawls,1))
        #we reconstruct the elements on the secondary diagonal at the end
        
                                                     
        middle_matrix = np.tile(differences[:,np.newaxis],(1,self.nr_trawls-2))
        whole_matrix  = np.concatenate([left_column,middle_matrix,right_column],axis=1)
        whole_matrix_reversed   = np.triu(np.fliplr(whole_matrix), k=0)
        np.fill_diagonal(whole_matrix_reversed,s_i1)     

        self.slice_areas_matrix = np.fliplr(whole_matrix_reversed)
    
    def simulate_slice_finite_decorrelation_time(self,slice_convolution_type):
        """helper for the `simulate_slice` method"""
        
        filter_ = np.fliplr(np.tril(np.ones(self.I),k=0)) 
        zero_matrix  = np.zeros([self.I,self.I-1])

        for simulation_nr in range(self.nr_simulations):
            gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
            jump_slices     = jump_part_sampler(self.jump_part_params,self.slice_areas_matrix,self.jump_part_name)
            
            if slice_convolution_type == 'fft':
        
                gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
                jump_slices = np.concatenate([zero_matrix,jump_slices],axis=1)
        
                #matrix with 1's on and below the secondary diagonal
                #flip the filter to agree with np convention
                self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
                self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
        
            elif slice_convolution_type == 'diagonals':
                
                self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
                self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)
                
                
    def simulate_slice_infinite_decorrelation_time(self,slice_convolution_type):
        """Helper for the `simulate_slice` method."""

        zero_matrix     = np.zeros([self.nr_trawls,self.nr_trawls-1])
        filter_         = np.fliplr(np.tril(np.ones(self.nr_trawls),k=0)) 


        for simulation_nr in range(self.nr_simulations):
            
            gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
            
            #the lower triangular part of the matrix is made oup of 0's, which can result in an error
            #in the scipy.stats sampler (for example, if the levy seed is gamma)
            #to prevent this, we extract the upper triangular part of the matrix as a vector
            #sample this way, then recast the samples as an upper triangular matrix
            slice_areas_row   = (np.fliplr(self.slice_areas_matrix))[np.triu_indices(self.slice_areas_matrix.shape[0], k = 0)]
            jump_slices_row   = jump_part_sampler(self.jump_part_params,slice_areas_row,self.jump_part_name)
            jump_slices       = np.zeros(gaussian_slices.shape)
            jump_slices[np.triu_indices(jump_slices.shape[0], k = 0)]     = jump_slices_row
            jump_slices       = np.fliplr(jump_slices)
             

            if slice_convolution_type == 'fft':
                gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
                jump_slices     = np.concatenate([zero_matrix,jump_slices],axis=1)
                
                self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
                self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
                
            elif slice_convolution_type == 'diagonals':
                
                self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
                self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)
        
        
    def simulate_slice(self,slice_convolution_type):
        """implements algorithm [] from [] and simulates teh trawl process at 
        \(\\tau,\\ldots,\\text{nr_trawls}\ \\tau\). `slice_convolution_type` can be either [to add]"""
        if self.decorrelation_time == -np.inf:
            self.compute_slice_areas_infinite_decorrelation_time()
            self.simulate_slice_infinite_decorrelation_time(slice_convolution_type)
             
        elif self.decorrelation_time > -np.inf:
            assert(self.trawl_function(self.decorrelation_time)) == 0,'please check decorrelation time' 
            self.compute_slice_areas_finite_decorrelation_time()
            self.simulate_slice_finite_decorrelation_time(slice_convolution_type)
        #self.values = self.gaussian_values + self.jump_values

                      
       ############################ II Grid ############################
    
    def grid_creation(self,min_t,max_t):
        """Creates a grid on \([0,\phi(0)] \\times [\\text{min_t}, \\text{max_t}]\). Each cell is represented by 
        the coordinates of its bottom left corner. To each cell we associate a sample from each of the gaussian
        and jump parts of the trawl process.
        
        Returns:
          gaussian_values:  array with the Gaussian of the Levy basis evaluated over the cells  
          jump_values: array with the jump part of the Levy basis evaluated over the cells      
        """
            
        coords = np.mgrid[0:self.trawl_function(0):self.mesh_size,min_t:max_t:self.mesh_size]
        x, t   = coords[0].flatten(), coords[1].flatten() 
        
        areas            = self.vol * np.ones([self.nr_simulations,len(t)])
        gaussian_values  = gaussian_part_sampler(self.gaussian_part_params,areas)
        jump_values      = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)
        
            
        return x,t,gaussian_values,jump_values
    
    def grid_update(self,i,t,gaussian_values,jump_values):
        """Inputs the values of the Levy basis evaluated over the grid cells on \([\\tau_{i-1}+\\text{truncation_grid},\\tau_{i-1}] \\times [0,\\phi(0)]\),
        removes the values corresponding to cells with time coordinates less than \(\\tau_{i} + \\text{truncation_grid}\) and adds new samples
        for the levy basis evaluated over the grid cells with time coordinates in \([\\tau_{i-1},\\tau_i]\) (see figure). 
        Assumes that the consecutive ambit sets at times \(\\tau_{i-1},\\tau_i\) are not disjoint, i.e.
        \(\\tau_i + \\text{truncation_grid} < \\tau_{i-1}\).
        
        Args:
          i: index of the trawl to be simulated
          t: time coordinates of the cells of the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          gaussian_values: gaussian values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          jump_values: jump values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)\)
        
        Returns:
          gaussian_values: gaussian values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
          jump_values: jump values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)                                                                                                                                                                                                
         """
          

        ind_to_keep       =  t >= (self.times_grid[i] + self.truncation_grid)
        t[~ind_to_keep]  += -self.truncation_grid
        
        areas             = self.vol * np.ones([self.nr_simulations,sum(~ind_to_keep)])
        #print(gaussian_values[:,~ind_to_keep].shape)
        #print(self.gaussian_part_sampler(areas).shape)
        gaussian_values[:,~ind_to_keep] = gaussian_part_sampler(self.gaussian_part_params,areas)
        jump_values[:,~ind_to_keep]     = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)  
        #print('ind to keep sum is ', ind_to_keep.sum())
        #print('gaussian is ',gaussian_values.shape)
        #print('non_gaussian_values ',non_gaussian_values[:,ind_to_keep].shape)
        #print('new_gaussian_values ',new_gaussian_values.shape)
        #print('t new shape is ',t.shape)
        #print('x shape is', x.shape)
        
        return t,gaussian_values,jump_values   
    
    
    def simulate_grid(self):
        """Simulate the trawl proces at times `self.times_grid`, which don't have to be
        equally distant, via the grid method."""
        
        #If `times_grid` are equidistnant, we do not need to compute `indicators` at each iteration, speeding up the process        

        for i in range(len(self.times_grid)):
             if (i==0) or (self.times_grid[i-1] <= self.times_grid[i] + self.truncation_grid):
                 #check that we are creating the grid for the first time or that 
                 #trawls at time i-1 and i have empty intersection
                 x,t,gaussian_values, jump_values = self.grid_creation(self.times_grid[i] + self.truncation_grid, self.times_grid[i])

                
             elif self.times_grid[i-1] > self.times_grid[i] + self.truncation_grid:
                 #check that we have non empty intersection and update the grid
                 t,gaussian_values,jump_values = self.grid_update(i,t,gaussian_values,jump_values)
            
             indicators = x < self.trawl_function(t-self.times_grid[i])
             #print(gaussian_values.shape,indicators.shape)
             self.gaussian_values[:,i]  = gaussian_values @ indicators
             self.jump_values[:,i]      = jump_values @ indicators
             
        #self.values = self.gaussian_values + self.jump_values
       ########################### III cpp ###########################
#    @njit   
    def simulate_cpp(self):
        """ text to be added"""
        min_t = min(self.cpp_times) + self.cpp_truncation
        max_t = max(self.cpp_times)
        min_x = 0
        max_x = self.trawl_function(0)
        
        for simulation_nr in range(self.nr_simulations):
            
        
            points_x, points_t, associated_values = generate_cpp_points(min_x = min_x, max_x = max_x, 
                        min_t = min_t, max_t = max_t, cpp_part_name = self.cpp_part_name,
                        cpp_part_params = self.cpp_part_params, cpp_intensity = self.cpp_intensity,
                        custom_sampler = self.custom_sampler)
                                    
            #(x_i,t_i) in A_t if t < t_i and x_i < phi(t_i-t)
            indicator_matrix = np.tile(points_x[:,np.newaxis],(1,self.nr_trawls)) < \
                            self.trawl_function(np.subtract.outer(points_t, self.cpp_times))
            self.cpp_values[simulation_nr,:] = associated_values @ indicator_matrix
                            
        
       ####################### simulate meta-method #######################
    def simulate(self,method,slice_convolution_type='diagonals'):
         """Function to simulate from the trawl function. Contains sanity checks
         for the simulation parameters and uses helper functions for each simulation
         method.
         
         Args:
           method: one of the strings `cpp`, `grid` or `slice`
           slice_convolution_type: if method is set to `slice`, this can be one of the strings `diagonals` or `ftt`, depending on the way we add up the simulated slices. This argument is ignored if method is set to `grid` or `cpp`."""

         #general checks
         assert isinstance(self.nr_simulations,int) and self.nr_simulations >0
         assert method in {'cpp','grid','slice'},'simulation method not supported'
         check_trawl_function(self.trawl_function)
         check_gaussian_params(self.gaussian_part_params)
         
         
         #algorithm specific checks and attribute setting
         if method == 'grid':
             check_jump_part_and_params(self.jump_part_name,self.jump_part_params)
             check_grid_params(self.mesh_size,self.truncation_grid,self.times_grid)
             
             self.nr_trawls = len(self.times_grid)
             self.vol = self.mesh_size **2
             
         elif method == 'cpp':
             check_cpp_params(self.cpp_part_name, self.cpp_part_params,self.cpp_intensity,self.custom_sampler)

             self.nr_trawls = len(self.cpp_times)
                 
         elif method == 'slice':
             assert slice_convolution_type in {'fft','diagonals'}
             assert isinstance(self.nr_trawls,int) and self.nr_trawls > 0,'nr_trawls should be a  strictly positive integer'
             check_jump_part_and_params(self.jump_part_name,self.jump_part_params)

             
         self.gaussian_values          =   np.zeros(shape = [self.nr_simulations,self.nr_trawls]) 
         self.jump_values              =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
         self.cpp_values               =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
        
        
         if method == 'grid':
             self.simulate_grid()
         elif method == 'cpp':
             self.simulate_cpp()
         elif method == 'slice':
             self.simulate_slice(slice_convolution_type)    

         self.values = self.gaussian_values + self.jump_values + self.cpp_values
         
             
    def theoretical_acf(self,t_values):
        """Computes the theoretical acf of the trawl process
        
        Args:
          t_values: array of time values 
        
        Returns:
          d_acf: a dictionary of the type  \(t: \\text{corr}(X_0,X_t)\), where \(t\) ranges over the input array `t_values`. 
        """
        total_area = quad(self.trawl_function,a=-np.inf,b= 0)[0]
        d_acf=dict()
        for t in t_values:
            d_acf[t] = quad(self.trawl_function,a=-np.inf,b= -t)[0]/total_area
        return d_acf
                  

             
    ######################################################################
    ###  Forecasting:      determinstic and probabilistic              ###
    ######################################################################
    
    
    def fit_gmm(self,input_values,envelope,levy_seed,lags,initial_guess=None):

        
        assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
        
        print('gmm fit started')
        
        envelope_params  = fit_trawl_envelope_gmm(self.tau,input_values,lags,envelope,initial_guess)
        levy_seed_params = fit_trawl_marginal(input_values,levy_seed)
        params =  {'envelope_params':envelope_params,'levy_seed_params': levy_seed_params}
        self.infered_parameters =  {'envelope': envelope, 'levy_seed': levy_seed, 'params' : params}
        
        print('gmm fit finished')
    
    def fit_cl(self,input_values, envelope, levy_seed, lags,  cl_optimisation_params = 
               {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
               initial_guess = None):
        
        assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
        print('cl fit started')
        print('cl fit finished')

        pass
    
    
    def predict(self,input_values, steps_ahead, deterministic, max_gaussian_lag = 1.0, nr_samples = None):
        
        #input_values = self.values[:,starting_index:]
        assert isinstance(input_values,np.ndarray) and len(input_values.shape) == 2
        assert deterministic  in [True,False]
        
        ##get the fitted parameters for teh envelope and for the levy seed from the attribute self.infered_parameters

        envelope         = self.infered_parameters['envelope']
        levy_seed        = self.infered_parameters['levy_seed']
        envelope_params  = self.infered_parameters['params']['envelope_params']
        levy_seed_params = self.infered_parameters['params']['levy_seed_params']
        nr_simulations, simulation_length = input_values.shape                                       
        d={}
        
        if levy_seed == 'gaussian':
            assert isinstance(max_gaussian_lag,int) and max_gaussian_lag > 0 and input_values.shape[-1] >= max_gaussian_lag
        
        for nr_steps_ahead in steps_ahead:
            
          if deterministic == True:
              
              array_to_add = np.zeros([nr_simulations,simulation_length - int((max_gaussian_lag - 1)) * (levy_seed == 'gaussian')])
              
          elif deterministic == False:
              
              array_to_add = np.zeros([nr_simulations, simulation_length - int((max_gaussian_lag - 1)) *(levy_seed == 'gaussian'),
                                       nr_samples])

          for i in range(nr_simulations):
              #to deal with gaussian lag helper
              
              if deterministic == True: 
                  array_to_add[i] = deterministic_forecasting(tau = self.tau, nr_steps_ahead =  nr_steps_ahead ,
                                    values = input_values[i], levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                    envelope = envelope, envelope_params = envelope_params[i], 
                                    envelope_function = None, max_gaussian_lag = max_gaussian_lag)
                        
              elif deterministic == False:
                  print(i)

                  array_to_add[i] = probabilistic_forecasting(tau = self.tau, nr_steps_ahead = nr_steps_ahead, values = input_values[i],
                                    levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                    envelope = envelope, envelope_params = envelope_params[i], nr_samples =  nr_samples,
                                    envelope_function = None, max_gaussian_lag = max_gaussian_lag)
          
          d[nr_steps_ahead] =  array_to_add       
                  
        return d
                    
                    
            
            #if type_ == 'deterministic':
            #    deterministic_forecasting(tau_ahead,values,levy_seed,levy_seed_params,envelope,
             #                                     envelope_params, nr_samples, envelope_function = None)
            
            #elif type__ == 'probabilistic':
            #    pass
    
    def fit_predict(self,steps_ahead,deterministic,fitting_method,envelope,levy_seed,lags,
                    initial_training_window,refit,refit_freq=None,initial_guess = None, 
                    cl_optimisation_params =  
                    {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                    max_gaussian_lag = None, nr_samples=None):
        
        #check inputs 
        assert all(isinstance(x, int) and x >0 for x in steps_ahead)
        assert deterministic in [True,False]
        assert fitting_method in ['gmm','cl']
        assert refit in [True,False]  
        if refit == True:
            assert refit_freq >0 and isinstance(refit_freq,int)
            
        assert isinstance(lags,tuple)  and all(isinstance(i,int) for i in lags)
        assert isinstance(initial_training_window,int) and  initial_training_window > 0 
        if fitting_method == 'cl':
            assert set(self.infered_parameters.keys()) == {'nr_mc_samples', 'nr_repetitions', 'nr_steps_optimisation'}
            assert all((isinstance(x,int) and x > 0)  for x in self.intered_parameters.values())
        if deterministic == False:
            assert isinstance(nr_samples,int) and nr_samples > 0

            
        if fitting_method == 'gmm':
            self.fit_gmm(input_values = self.values[:,:initial_training_window],envelope = envelope,
                         levy_seed = levy_seed, lags = lags, initial_guess = initial_guess)
            
        elif fitting_method == 'cl':
            self.fit_cl(input_values = self.values[:,:initial_training_window],
                        envelope = envelope, levy_seed = levy_seed, lags = lags,cl_optimisation_params = 
                        {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                        initial_guess = None)
                
        if refit == False:   
            
            return self.predict(input_values = self.values[:,:initial_training_window], steps_ahead = steps_ahead,
                             deterministic = deterministic, max_gaussian_lag = max_gaussian_lag,
                             nr_samples = nr_samples)
            
        elif refit == True:
            
            raise ValueError('not yet implemented')

Methods

def compute_slice_areas_finite_decorrelation_time(self)

Computes the $I \times k$ matrix

$\begin{bmatrix} a_0 & a_0 - a_1 \ldots & a_0 - a_1 \\ a_1 & a_1 - a_2 \ldots & a_1 - a_2 \\ a_2 & a_2 - a_3 \ldots & a_2 - a_3 \\ & \vdots & \\ a_{k-2} & a_{k-2} - a_{k-1} \ldots & a_{k-2} - a_{k-1} \\ a_{k-1} & a_{k-1} & a_{k-1} \end{bmatrix}$

corresponding to the areas of the slices

$\begin{bmatrix} L(S_{11}) & \ldots & L(S_{1,k-1}) & L(S_{1k}) \\ L(S_{21}) & \ldots & L(S_{2,k-1}) & L(S_{2k}) \\ \vdots & & \vdots & \vdots \\ L(S_{I1}) & \ldots & L(S_{I,k-1}) & L(S_{I,k}) \end{bmatrix}$

where $k =$ self.nr_trawls and

$\begin{align} a_0 &= \int_{-\tau}^0 \phi(u)du, \\ \vdots & \\ a_{k-2} &= \int_{(-k+1)\tau} ^{(-k+2) \tau} \phi(u) du, \\ a_{k-1} &= \int_{\text{decorrelation_time}}^{(-k+1)\tau} \phi(u)du. \end{align}$

Expand source code

def compute_slice_areas_finite_decorrelation_time(self):
    """Computes the \(I \\times k\) matrix 
    
    \[\\begin{bmatrix}
          a_0     &  a_0 - a_1          \\ldots  & a_0 - a_1          \\\\
          a_1     &  a_1 - a_2          \\ldots  & a_1 - a_2          \\\\
          a_2     &  a_2 - a_3          \\ldots  & a_2 - a_3          \\\\
                  &                     \\vdots  &                    \\\\
          a_{k-2} & a_{k-2} - a_{k-1}   \\ldots  & a_{k-2} - a_{k-1}  \\\\
          a_{k-1} & a_{k-1}                      & a_{k-1}            
    \\end{bmatrix}\]
    
    corresponding to the areas of the slices 
    
            
    \[\\begin{bmatrix}
    L(S_{11})  & \\ldots & L(S_{1,k-1}) & L(S_{1k}) \\\\
    L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & L(S_{2k}) \\\\
     \\vdots &       &  \\vdots  & \\vdots  \\\\
    L(S_{I1}) &  \\ldots &  L(S_{I,k-1}) & L(S_{I,k})
    \\end{bmatrix}
    \]
        
    where \(k =\) `self.nr_trawls` and 
    
    \[\\begin{align}
    a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
        \\vdots & \\\\
    a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
    a_{k-1} &= \int_{\\text{decorrelation_time}}^{(-k+1)\\tau} \phi(u)du.
    \\end{align} 
    \]            
        """
    self.I = math.ceil(-self.decorrelation_time/self.tau)
    
    s_i1 = [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
            for i in range(1,self.I+1)]
    s_i2 = np.append(np.diff(s_i1[::-1])[::-1],s_i1[-1])
    
    right_column = np.tile(s_i2[:,np.newaxis],(1,self.nr_trawls-1))
    left_column  = left_column  = (np.array(s_i1))[:,np.newaxis]
    self.slice_areas_matrix  = np.concatenate([left_column,right_column],axis=1)

def compute_slice_areas_infinite_decorrelation_time(self)

Computes the $k \times k$ matrix

$\begin{bmatrix} a_0 & a_0 - a_1 & a_0 - a_1 & \ldots & a_0 - a_1 & a_0 - a_1 & a_0 \\ a_1 & a_1 - a_2 & a_1 - a_2 & \ldots & a_1 - a_2 & a_1 & 0 \\ a_2 & a_2 - a_3 & a_2 - a_3 & \ldots & a_2 & 0 & 0 \\ & & & \vdots & & & \\ a_{k-2} & a_{k-1} & 0 & \ldots & 0 & 0 & 0 \\ a_{k-1} & 0 & 0 & & 0 & 0 & 0 \end{bmatrix}$

corresponding to the areas of the slices

$\begin{bmatrix} L(S_{11}) & \ldots & L(S_{1k,-1}) & L(S_{1k}) \\ L(S_{21}) & \ldots & L(S_{2,k-1}) & 0 \\ \vdots & & \vdots & \vdots \\ L(S_{k1}) & \ldots & 0 & 0 \end{bmatrix}$

where $k =$ self.nr_trawls and

$\begin{align} a_0 &= \int_{-\tau}^0 \phi(u)du, \\ \vdots & \\ a_{k-2} &= \int_{(-k+1)\tau} ^{(-k+2) \tau} \phi(u) du, \\ a_{k-1} &= \int_{-\infty}^{(-k+1)\tau} \phi(u)du. \end{align}$

Expand source code

def compute_slice_areas_infinite_decorrelation_time(self):
    """Computes the  \(k \\times k\) matrix  
    
    \[\\begin{bmatrix}
          a_0     &  a_0 - a_1  & a_0 - a_1  &    \\ldots  & a_0 - a_1  & a_0 - a_1  & a_0 \\\\
          a_1     &  a_1 - a_2  & a_1 - a_2  &    \\ldots  & a_1 - a_2  & a_1        & 0   \\\\
          a_2     &  a_2 - a_3  & a_2 - a_3  &    \\ldots  & a_2        & 0          & 0   \\\\
                  &             &            &    \\vdots  &            &            &     \\\\
          a_{k-2} & a_{k-1}     & 0          &    \\ldots  &  0         & 0          & 0   \\\\
          a_{k-1} & 0           & 0          &             &  0         & 0          & 0
    \\end{bmatrix}\]
        
    corresponding to the areas of the slices 
    
            
    \[\\begin{bmatrix}
    L(S_{11})  & \\ldots & L(S_{1k,-1}) & L(S_{1k}) \\\\
    L(S_{21})  &  \\ldots &  L(S_{2,k-1}) & 0 \\\\
     \\vdots &       &  \\vdots  & \\vdots  \\\\
    L(S_{k1}) &  \\ldots &  0 & 0
    \\end{bmatrix}
    \]
     
    
    where \(k =\) `self.nr_trawls` and 
    
    \[\\begin{align}
    a_0 &= \int_{-\\tau}^0 \phi(u)du, \\\\
        \\vdots & \\\\
    a_{k-2} &= \int_{(-k+1)\\tau} ^{(-k+2)  \\tau} \phi(u) du, \\\\
    a_{k-1} &= \int_{-\infty}^{(-k+1)\\tau} \phi(u)du.
    \\end{align} 
    \]
    """
    s_i1 =  [quad(self.trawl_function,a=-i *self.tau, b = (-i+1) * self.tau)[0]
             for i in range(1,self.nr_trawls)] + [quad(self.trawl_function,a=-np.inf,
                                                       b=(-self.nr_trawls+1)*self.tau)[0]]
    
                                                       
    #  a[0] -a[1] ,a[1] -a[2], ... , a[k-2] - a[k-1] , 0
    differences   = np.append(np.diff(s_i1[::-1])[::-1],0) 

    left_column  = np.array(s_i1)[:,np.newaxis]  
    right_column = np.zeros((self.nr_trawls,1))
    #we reconstruct the elements on the secondary diagonal at the end
    
                                                 
    middle_matrix = np.tile(differences[:,np.newaxis],(1,self.nr_trawls-2))
    whole_matrix  = np.concatenate([left_column,middle_matrix,right_column],axis=1)
    whole_matrix_reversed   = np.triu(np.fliplr(whole_matrix), k=0)
    np.fill_diagonal(whole_matrix_reversed,s_i1)     

    self.slice_areas_matrix = np.fliplr(whole_matrix_reversed)

def fit_cl(self, input_values, envelope, levy_seed, lags, cl_optimisation_params={'nr_steps_optimisation': 25, 'nr_mc_samples': 10000, 'nr_repetitions': 5}, initial_guess=None)

Expand source code

def fit_cl(self,input_values, envelope, levy_seed, lags,  cl_optimisation_params = 
           {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
           initial_guess = None):
    
    assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
    print('cl fit started')
    print('cl fit finished')

    pass

def fit_gmm(self, input_values, envelope, levy_seed, lags, initial_guess=None)

Expand source code

def fit_gmm(self,input_values,envelope,levy_seed,lags,initial_guess=None):

    
    assert isinstance(lags,tuple) and all(isinstance(i,int) for i in lags)
    
    print('gmm fit started')
    
    envelope_params  = fit_trawl_envelope_gmm(self.tau,input_values,lags,envelope,initial_guess)
    levy_seed_params = fit_trawl_marginal(input_values,levy_seed)
    params =  {'envelope_params':envelope_params,'levy_seed_params': levy_seed_params}
    self.infered_parameters =  {'envelope': envelope, 'levy_seed': levy_seed, 'params' : params}
    
    print('gmm fit finished')

def fit_predict(self, steps_ahead, deterministic, fitting_method, envelope, levy_seed, lags, initial_training_window, refit, refit_freq=None, initial_guess=None, cl_optimisation_params={'nr_steps_optimisation': 25, 'nr_mc_samples': 10000, 'nr_repetitions': 5}, max_gaussian_lag=None, nr_samples=None)

Expand source code

def fit_predict(self,steps_ahead,deterministic,fitting_method,envelope,levy_seed,lags,
                initial_training_window,refit,refit_freq=None,initial_guess = None, 
                cl_optimisation_params =  
                {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                max_gaussian_lag = None, nr_samples=None):
    
    #check inputs 
    assert all(isinstance(x, int) and x >0 for x in steps_ahead)
    assert deterministic in [True,False]
    assert fitting_method in ['gmm','cl']
    assert refit in [True,False]  
    if refit == True:
        assert refit_freq >0 and isinstance(refit_freq,int)
        
    assert isinstance(lags,tuple)  and all(isinstance(i,int) for i in lags)
    assert isinstance(initial_training_window,int) and  initial_training_window > 0 
    if fitting_method == 'cl':
        assert set(self.infered_parameters.keys()) == {'nr_mc_samples', 'nr_repetitions', 'nr_steps_optimisation'}
        assert all((isinstance(x,int) and x > 0)  for x in self.intered_parameters.values())
    if deterministic == False:
        assert isinstance(nr_samples,int) and nr_samples > 0

        
    if fitting_method == 'gmm':
        self.fit_gmm(input_values = self.values[:,:initial_training_window],envelope = envelope,
                     levy_seed = levy_seed, lags = lags, initial_guess = initial_guess)
        
    elif fitting_method == 'cl':
        self.fit_cl(input_values = self.values[:,:initial_training_window],
                    envelope = envelope, levy_seed = levy_seed, lags = lags,cl_optimisation_params = 
                    {'nr_steps_optimisation' : 25,'nr_mc_samples'  : 10**4,  'nr_repetitions' : 5},
                    initial_guess = None)
            
    if refit == False:   
        
        return self.predict(input_values = self.values[:,:initial_training_window], steps_ahead = steps_ahead,
                         deterministic = deterministic, max_gaussian_lag = max_gaussian_lag,
                         nr_samples = nr_samples)
        
    elif refit == True:
        
        raise ValueError('not yet implemented')

def grid_creation(self, min_t, max_t)

Creates a grid on $[0,\phi(0)] \times [\text{min_t}, \text{max_t}]$ . Each cell is represented by the coordinates of its bottom left corner. To each cell we associate a sample from each of the gaussian and jump parts of the trawl process.

Returns

gaussian_values: array with the Gaussian of the Levy basis evaluated over the cells
jump_values: array with the jump part of the Levy basis evaluated over the cells

Expand source code

def grid_creation(self,min_t,max_t):
    """Creates a grid on \([0,\phi(0)] \\times [\\text{min_t}, \\text{max_t}]\). Each cell is represented by 
    the coordinates of its bottom left corner. To each cell we associate a sample from each of the gaussian
    and jump parts of the trawl process.
    
    Returns:
      gaussian_values:  array with the Gaussian of the Levy basis evaluated over the cells  
      jump_values: array with the jump part of the Levy basis evaluated over the cells      
    """
        
    coords = np.mgrid[0:self.trawl_function(0):self.mesh_size,min_t:max_t:self.mesh_size]
    x, t   = coords[0].flatten(), coords[1].flatten() 
    
    areas            = self.vol * np.ones([self.nr_simulations,len(t)])
    gaussian_values  = gaussian_part_sampler(self.gaussian_part_params,areas)
    jump_values      = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)
    
        
    return x,t,gaussian_values,jump_values

def grid_update(self, i, t, gaussian_values, jump_values)

Inputs the values of the Levy basis evaluated over the grid cells on $[\tau_{i-1}+\text{truncation_grid},\tau_{i-1}] \times [0,\phi(0)]$ , removes the values corresponding to cells with time coordinates less than $\tau_{i} + \text{truncation_grid}$ and adds new samples for the levy basis evaluated over the grid cells with time coordinates in $[\tau_{i-1},\tau_i]$ (see figure). Assumes that the consecutive ambit sets at times $\tau_{i-1},\tau_i$ are not disjoint, i.e. $\tau_i + \text{truncation_grid} < \tau_{i-1}$ .

Args

i: index of the trawl to be simulated
t: time coordinates of the cells of the grid on $[\tau_{i-1},\tau_{i-1}+\text{truncation_grid}] \times [0,\phi(0)]$
gaussian_values: gaussian values for the grid on $[\tau_{i-1},\tau_{i-1}+\text{truncation_grid}] \times [0,\phi(0)]$
jump_values: jump values for the grid on $[\tau_{i-1},\tau_{i-1}+\text{truncation_grid}] \times [0,\phi(0)$

Returns

gaussian_values: gaussian values for the grid cells on $[\tau_{i},\tau_{i}+\text{truncation_grid}] \times [0,\phi(0)]$
jump_values: jump values for the grid cells on $[\tau_{i},\tau_{i}+\text{truncation_grid}] \times [0,\phi(0)]$

Expand source code

def grid_update(self,i,t,gaussian_values,jump_values):
    """Inputs the values of the Levy basis evaluated over the grid cells on \([\\tau_{i-1}+\\text{truncation_grid},\\tau_{i-1}] \\times [0,\\phi(0)]\),
    removes the values corresponding to cells with time coordinates less than \(\\tau_{i} + \\text{truncation_grid}\) and adds new samples
    for the levy basis evaluated over the grid cells with time coordinates in \([\\tau_{i-1},\\tau_i]\) (see figure). 
    Assumes that the consecutive ambit sets at times \(\\tau_{i-1},\\tau_i\) are not disjoint, i.e.
    \(\\tau_i + \\text{truncation_grid} < \\tau_{i-1}\).
    
    Args:
      i: index of the trawl to be simulated
      t: time coordinates of the cells of the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
      gaussian_values: gaussian values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
      jump_values: jump values for the grid on \([\\tau_{i-1},\\tau_{i-1}+\\text{truncation_grid}] \\times [0,\phi(0)\)
    
    Returns:
      gaussian_values: gaussian values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)
      jump_values: jump values for the grid cells on \([\\tau_{i},\\tau_{i}+\\text{truncation_grid}] \\times [0,\phi(0)]\)                                                                                                                                                                                                
     """
      

    ind_to_keep       =  t >= (self.times_grid[i] + self.truncation_grid)
    t[~ind_to_keep]  += -self.truncation_grid
    
    areas             = self.vol * np.ones([self.nr_simulations,sum(~ind_to_keep)])
    #print(gaussian_values[:,~ind_to_keep].shape)
    #print(self.gaussian_part_sampler(areas).shape)
    gaussian_values[:,~ind_to_keep] = gaussian_part_sampler(self.gaussian_part_params,areas)
    jump_values[:,~ind_to_keep]     = jump_part_sampler(self.jump_part_params,areas,self.jump_part_name)  
    #print('ind to keep sum is ', ind_to_keep.sum())
    #print('gaussian is ',gaussian_values.shape)
    #print('non_gaussian_values ',non_gaussian_values[:,ind_to_keep].shape)
    #print('new_gaussian_values ',new_gaussian_values.shape)
    #print('t new shape is ',t.shape)
    #print('x shape is', x.shape)
    
    return t,gaussian_values,jump_values

def predict(self, input_values, steps_ahead, deterministic, max_gaussian_lag=1.0, nr_samples=None)

Expand source code

def predict(self,input_values, steps_ahead, deterministic, max_gaussian_lag = 1.0, nr_samples = None):
    
    #input_values = self.values[:,starting_index:]
    assert isinstance(input_values,np.ndarray) and len(input_values.shape) == 2
    assert deterministic  in [True,False]
    
    ##get the fitted parameters for teh envelope and for the levy seed from the attribute self.infered_parameters

    envelope         = self.infered_parameters['envelope']
    levy_seed        = self.infered_parameters['levy_seed']
    envelope_params  = self.infered_parameters['params']['envelope_params']
    levy_seed_params = self.infered_parameters['params']['levy_seed_params']
    nr_simulations, simulation_length = input_values.shape                                       
    d={}
    
    if levy_seed == 'gaussian':
        assert isinstance(max_gaussian_lag,int) and max_gaussian_lag > 0 and input_values.shape[-1] >= max_gaussian_lag
    
    for nr_steps_ahead in steps_ahead:
        
      if deterministic == True:
          
          array_to_add = np.zeros([nr_simulations,simulation_length - int((max_gaussian_lag - 1)) * (levy_seed == 'gaussian')])
          
      elif deterministic == False:
          
          array_to_add = np.zeros([nr_simulations, simulation_length - int((max_gaussian_lag - 1)) *(levy_seed == 'gaussian'),
                                   nr_samples])

      for i in range(nr_simulations):
          #to deal with gaussian lag helper
          
          if deterministic == True: 
              array_to_add[i] = deterministic_forecasting(tau = self.tau, nr_steps_ahead =  nr_steps_ahead ,
                                values = input_values[i], levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                envelope = envelope, envelope_params = envelope_params[i], 
                                envelope_function = None, max_gaussian_lag = max_gaussian_lag)
                    
          elif deterministic == False:
              print(i)

              array_to_add[i] = probabilistic_forecasting(tau = self.tau, nr_steps_ahead = nr_steps_ahead, values = input_values[i],
                                levy_seed = levy_seed, levy_seed_params = levy_seed_params[i],
                                envelope = envelope, envelope_params = envelope_params[i], nr_samples =  nr_samples,
                                envelope_function = None, max_gaussian_lag = max_gaussian_lag)
      
      d[nr_steps_ahead] =  array_to_add       
              
    return d

def simulate(self, method, slice_convolution_type='diagonals')

Function to simulate from the trawl function. Contains sanity checks for the simulation parameters and uses helper functions for each simulation method.

Args

method: one of the strings cpp, grid or slice
slice_convolution_type: if method is set to slice, this can be one of the strings diagonals or ftt, depending on the way we add up the simulated slices. This argument is ignored if method is set to grid or cpp.

Expand source code

def simulate(self,method,slice_convolution_type='diagonals'):
     """Function to simulate from the trawl function. Contains sanity checks
     for the simulation parameters and uses helper functions for each simulation
     method.
     
     Args:
       method: one of the strings `cpp`, `grid` or `slice`
       slice_convolution_type: if method is set to `slice`, this can be one of the strings `diagonals` or `ftt`, depending on the way we add up the simulated slices. This argument is ignored if method is set to `grid` or `cpp`."""

     #general checks
     assert isinstance(self.nr_simulations,int) and self.nr_simulations >0
     assert method in {'cpp','grid','slice'},'simulation method not supported'
     check_trawl_function(self.trawl_function)
     check_gaussian_params(self.gaussian_part_params)
     
     
     #algorithm specific checks and attribute setting
     if method == 'grid':
         check_jump_part_and_params(self.jump_part_name,self.jump_part_params)
         check_grid_params(self.mesh_size,self.truncation_grid,self.times_grid)
         
         self.nr_trawls = len(self.times_grid)
         self.vol = self.mesh_size **2
         
     elif method == 'cpp':
         check_cpp_params(self.cpp_part_name, self.cpp_part_params,self.cpp_intensity,self.custom_sampler)

         self.nr_trawls = len(self.cpp_times)
             
     elif method == 'slice':
         assert slice_convolution_type in {'fft','diagonals'}
         assert isinstance(self.nr_trawls,int) and self.nr_trawls > 0,'nr_trawls should be a  strictly positive integer'
         check_jump_part_and_params(self.jump_part_name,self.jump_part_params)

         
     self.gaussian_values          =   np.zeros(shape = [self.nr_simulations,self.nr_trawls]) 
     self.jump_values              =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
     self.cpp_values               =   np.zeros(shape = [self.nr_simulations,self.nr_trawls])
    
    
     if method == 'grid':
         self.simulate_grid()
     elif method == 'cpp':
         self.simulate_cpp()
     elif method == 'slice':
         self.simulate_slice(slice_convolution_type)    

     self.values = self.gaussian_values + self.jump_values + self.cpp_values

def simulate_cpp(self)

text to be added

Expand source code

def simulate_cpp(self):
    """ text to be added"""
    min_t = min(self.cpp_times) + self.cpp_truncation
    max_t = max(self.cpp_times)
    min_x = 0
    max_x = self.trawl_function(0)
    
    for simulation_nr in range(self.nr_simulations):
        
    
        points_x, points_t, associated_values = generate_cpp_points(min_x = min_x, max_x = max_x, 
                    min_t = min_t, max_t = max_t, cpp_part_name = self.cpp_part_name,
                    cpp_part_params = self.cpp_part_params, cpp_intensity = self.cpp_intensity,
                    custom_sampler = self.custom_sampler)
                                
        #(x_i,t_i) in A_t if t < t_i and x_i < phi(t_i-t)
        indicator_matrix = np.tile(points_x[:,np.newaxis],(1,self.nr_trawls)) < \
                        self.trawl_function(np.subtract.outer(points_t, self.cpp_times))
        self.cpp_values[simulation_nr,:] = associated_values @ indicator_matrix

def simulate_grid(self)

Simulate the trawl proces at times self.times_grid, which don't have to be equally distant, via the grid method.

Expand source code

def simulate_grid(self):
    """Simulate the trawl proces at times `self.times_grid`, which don't have to be
    equally distant, via the grid method."""
    
    #If `times_grid` are equidistnant, we do not need to compute `indicators` at each iteration, speeding up the process        

    for i in range(len(self.times_grid)):
         if (i==0) or (self.times_grid[i-1] <= self.times_grid[i] + self.truncation_grid):
             #check that we are creating the grid for the first time or that 
             #trawls at time i-1 and i have empty intersection
             x,t,gaussian_values, jump_values = self.grid_creation(self.times_grid[i] + self.truncation_grid, self.times_grid[i])

            
         elif self.times_grid[i-1] > self.times_grid[i] + self.truncation_grid:
             #check that we have non empty intersection and update the grid
             t,gaussian_values,jump_values = self.grid_update(i,t,gaussian_values,jump_values)
        
         indicators = x < self.trawl_function(t-self.times_grid[i])
         #print(gaussian_values.shape,indicators.shape)
         self.gaussian_values[:,i]  = gaussian_values @ indicators
         self.jump_values[:,i]      = jump_values @ indicators

def simulate_slice(self, slice_convolution_type)

implements algorithm [] from [] and simulates teh trawl process at $\tau,\ldots,\text{nr_trawls}\ \tau$ . slice_convolution_type can be either [to add]

Expand source code

def simulate_slice(self,slice_convolution_type):
    """implements algorithm [] from [] and simulates teh trawl process at 
    \(\\tau,\\ldots,\\text{nr_trawls}\ \\tau\). `slice_convolution_type` can be either [to add]"""
    if self.decorrelation_time == -np.inf:
        self.compute_slice_areas_infinite_decorrelation_time()
        self.simulate_slice_infinite_decorrelation_time(slice_convolution_type)
         
    elif self.decorrelation_time > -np.inf:
        assert(self.trawl_function(self.decorrelation_time)) == 0,'please check decorrelation time' 
        self.compute_slice_areas_finite_decorrelation_time()
        self.simulate_slice_finite_decorrelation_time(slice_convolution_type)

def simulate_slice_finite_decorrelation_time(self, slice_convolution_type)

helper for the simulate_slice method

Expand source code

def simulate_slice_finite_decorrelation_time(self,slice_convolution_type):
    """helper for the `simulate_slice` method"""
    
    filter_ = np.fliplr(np.tril(np.ones(self.I),k=0)) 
    zero_matrix  = np.zeros([self.I,self.I-1])

    for simulation_nr in range(self.nr_simulations):
        gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
        jump_slices     = jump_part_sampler(self.jump_part_params,self.slice_areas_matrix,self.jump_part_name)
        
        if slice_convolution_type == 'fft':
    
            gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
            jump_slices = np.concatenate([zero_matrix,jump_slices],axis=1)
    
            #matrix with 1's on and below the secondary diagonal
            #flip the filter to agree with np convention
            self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
            self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
    
        elif slice_convolution_type == 'diagonals':
            
            self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
            self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)

def simulate_slice_infinite_decorrelation_time(self, slice_convolution_type)

Helper for the simulate_slice method.

Expand source code

def simulate_slice_infinite_decorrelation_time(self,slice_convolution_type):
    """Helper for the `simulate_slice` method."""

    zero_matrix     = np.zeros([self.nr_trawls,self.nr_trawls-1])
    filter_         = np.fliplr(np.tril(np.ones(self.nr_trawls),k=0)) 


    for simulation_nr in range(self.nr_simulations):
        
        gaussian_slices = gaussian_part_sampler(self.gaussian_part_params,self.slice_areas_matrix) 
        
        #the lower triangular part of the matrix is made oup of 0's, which can result in an error
        #in the scipy.stats sampler (for example, if the levy seed is gamma)
        #to prevent this, we extract the upper triangular part of the matrix as a vector
        #sample this way, then recast the samples as an upper triangular matrix
        slice_areas_row   = (np.fliplr(self.slice_areas_matrix))[np.triu_indices(self.slice_areas_matrix.shape[0], k = 0)]
        jump_slices_row   = jump_part_sampler(self.jump_part_params,slice_areas_row,self.jump_part_name)
        jump_slices       = np.zeros(gaussian_slices.shape)
        jump_slices[np.triu_indices(jump_slices.shape[0], k = 0)]     = jump_slices_row
        jump_slices       = np.fliplr(jump_slices)
         

        if slice_convolution_type == 'fft':
            gaussian_slices = np.concatenate([zero_matrix,gaussian_slices],axis=1)
            jump_slices     = np.concatenate([zero_matrix,jump_slices],axis=1)
            
            self.gaussian_values[simulation_nr,:] = convolve2d(gaussian_slices,filter_[::-1,::-1],'valid')[0]
            self.jump_values[simulation_nr,:]     = convolve2d(jump_slices,filter_[::-1,::-1],'valid')[0]
            
        elif slice_convolution_type == 'diagonals':
            
            self.gaussian_values[simulation_nr,:] = cumulative_and_diagonal_sums(gaussian_slices)
            self.jump_values[simulation_nr,:] =  cumulative_and_diagonal_sums(jump_slices)

def theoretical_acf(self, t_values)

Computes the theoretical acf of the trawl process

Args

t_values: array of time values

Returns

d_acf: a dictionary of the type $t: \text{corr}(X_0,X_t)$ , where $t$ ranges over the input array t_values.

Expand source code

def theoretical_acf(self,t_values):
    """Computes the theoretical acf of the trawl process
    
    Args:
      t_values: array of time values 
    
    Returns:
      d_acf: a dictionary of the type  \(t: \\text{corr}(X_0,X_t)\), where \(t\) ranges over the input array `t_values`. 
    """
    total_area = quad(self.trawl_function,a=-np.inf,b= 0)[0]
    d_acf=dict()
    for t in t_values:
        d_acf[t] = quad(self.trawl_function,a=-np.inf,b= -t)[0]/total_area
    return d_acf