pyFTS/benchmarks/parallel_benchmarks.py

"""
joblib-parallelized benchmarks for FTS methods
"""

import datetime
import multiprocessing
import time
from copy import deepcopy

import numpy as np
from joblib import Parallel, delayed

from pyFTS.benchmarks import benchmarks, Util
from pyFTS.common import Util
from pyFTS.partitioners import Grid


def run_point(mfts, partitioner, train_data, test_data, transformation=None, indexer=None):
    """
    Train one FTS model and measure its point forecast accuracy

    Worker function dispatched through joblib by point_sliding_window. Any
    exception raised while training or measuring is printed and reported as
    NaN values instead of being propagated to the caller.

    :param mfts: FTS model; its partitioner attribute is assigned here and the
                 transformation (if any) is appended to it
    :param partitioner: already built Universe of Discourse partitioner (its
                        sets and partitions attributes are read)
    :param train_data: data used to train the model
    :param test_data: data used to test the model
    :param transformation: data transformation, appended to the model when not None
    :param indexer: seasonal indexer, forwarded to benchmarks.get_point_statistics
    :return: a dictionary with the keys 'key', 'obj', 'rmse', 'smape', 'u' and
             'time' (training plus evaluation wall-clock seconds)
    """
    # The last component of the partitioner's module path identifies it in the label.
    partitioner_name = str(partitioner.__module__).rsplit('.', 1)[-1]
    label = " ".join([mfts.shortname, "n =", str(mfts.order),
                      partitioner_name, "q =", str(partitioner.partitions)])

    mfts.partitioner = partitioner
    if transformation is not None:
        mfts.appendTransformation(transformation)

    try:
        tic = time.time()
        mfts.train(train_data, partitioner.sets, order=mfts.order)
        elapsed = time.time() - tic

        tic = time.time()
        rmse, smape, u = benchmarks.get_point_statistics(test_data, mfts, indexer)
        elapsed += time.time() - tic
    except Exception as ex:
        # Best effort: a failing model must not abort the whole benchmark run.
        print(ex)
        rmse = smape = u = elapsed = np.nan

    outcome = {
        'key': label,
        'obj': mfts,
        'rmse': rmse,
        'smape': smape,
        'u': u,
        'time': elapsed,
    }

    print(outcome)

    return outcome


def point_sliding_window(data, windowsize, train=0.8, models=None, partitioners=[Grid.GridPartitioner],
                         partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,
                         save=False, file=None, sintetic=False):
    """
    Parallel sliding window benchmarks for FTS point forecasters

    For every window yielded by Util.sliding_window, and for every combination
    of partition count and partitioner, each candidate model is trained and
    evaluated by run_point inside a joblib Parallel call that uses one job per
    CPU core. The per-model metrics of all windows are accumulated and handed
    to Util.save_dataframe_point.

    :param data: data forwarded to Util.sliding_window
    :param windowsize: size of sliding window
    :param train: percentual of sliding window data used to train the models
    :param models: FTS point forecaster constructors, each called as model("");
                   when None, benchmarks.get_point_methods() is used
    :param partitioners: Universe of Discourse partitioner constructors
    :param partitions: the numbers of partitions of the Universe of Discourse to test
    :param max_order: the max order of the models (for high order models)
    :param transformation: data transformation
    :param indexer: seasonal indexer, forwarded to run_point
    :param dump: if true, print the identifier of each window
    :param save: save results
    :param file: file path to save the results
    :param sintetic: if true only the average and standard deviation of the results
    :return: the value returned by Util.save_dataframe_point
    """
    # NOTE: the list defaults in the signature are shared between calls; they
    # are only iterated here, never mutated.
    _process_start = time.time()

    print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))

    num_cores = multiprocessing.cpu_count()

    # Honour an explicit model list; fall back to the library's point methods.
    if models is None:
        models = benchmarks.get_point_methods()

    # One pool entry per (model, order) combination to be benchmarked.
    pool = []
    for model in models:
        mfts = model("")

        if mfts.is_high_order:
            for order in np.arange(1, max_order + 1):
                if order >= mfts.min_order:
                    mfts = model("")
                    mfts.order = order
                    pool.append(mfts)
        else:
            pool.append(mfts)

    objs = {}
    rmse = {}
    smape = {}
    u = {}
    times = {}

    experiments = 0
    # Distinct loop names keep the `train` ratio argument from being shadowed.
    for ct, train_data, test_data in Util.sliding_window(data, windowsize, train):
        experiments += 1

        if dump:
            print('\nWindow: {0}\n'.format(ct))

        for partition in partitions:

            for partitioner in partitioners:

                data_train_fs = partitioner(train_data, partition, transformation=transformation)

                results = Parallel(n_jobs=num_cores)(
                    delayed(run_point)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train_data),
                                       deepcopy(test_data), transformation, indexer)
                    for m in pool)

                for tmp in results:
                    key = tmp['key']
                    # Keep the first trained object seen for each configuration.
                    if key not in objs:
                        objs[key] = tmp['obj']
                    rmse.setdefault(key, []).append(tmp['rmse'])
                    smape.setdefault(key, []).append(tmp['smape'])
                    u.setdefault(key, []).append(tmp['u'])
                    times.setdefault(key, []).append(tmp['time'])

    _process_end = time.time()

    print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))

    print("Process Duration: {0}".format(_process_end - _process_start))

    # NOTE(review): `Util` is rebound by the second import at the top of the
    # file, so this resolves to pyFTS.common.Util - confirm that
    # save_dataframe_point is defined there and not in pyFTS.benchmarks.Util.
    return Util.save_dataframe_point(experiments, file, objs, rmse, save, sintetic, smape, times, u)


def run_interval(mfts, partitioner, train_data, test_data, transformation=None, indexer=None):
    """
    Train one FTS model and measure its interval forecast quality

    Worker function dispatched through joblib by interval_sliding_window. Any
    exception raised while training or measuring is printed and reported as
    NaN values instead of being propagated to the caller.

    :param mfts: FTS model; its partitioner attribute is assigned here and the
                 transformation (if any) is appended to it
    :param partitioner: already built Universe of Discourse partitioner (its
                        sets and partitions attributes are read)
    :param train_data: data used to train the model
    :param test_data: data used to test the model
    :param transformation: data transformation, appended to the model when not None
    :param indexer: seasonal indexer (accepted but not used by this function)
    :return: a dictionary with the keys 'key', 'obj', 'sharpness', 'resolution',
             'coverage' and 'time' (training plus evaluation wall-clock seconds)
    """
    # The last component of the partitioner's module path identifies it in the label.
    partitioner_name = str(partitioner.__module__).rsplit('.', 1)[-1]
    label = " ".join([mfts.shortname, "n =", str(mfts.order),
                      partitioner_name, "q =", str(partitioner.partitions)])

    mfts.partitioner = partitioner
    if transformation is not None:
        mfts.appendTransformation(transformation)

    try:
        tic = time.time()
        mfts.train(train_data, partitioner.sets, order=mfts.order)
        elapsed = time.time() - tic

        tic = time.time()
        sharpness, resolution, coverage = benchmarks.get_interval_statistics(test_data, mfts)
        elapsed += time.time() - tic
    except Exception as ex:
        # Best effort: a failing model must not abort the whole benchmark run.
        print(ex)
        sharpness = resolution = coverage = elapsed = np.nan

    outcome = {
        'key': label,
        'obj': mfts,
        'sharpness': sharpness,
        'resolution': resolution,
        'coverage': coverage,
        'time': elapsed,
    }

    print(outcome)

    return outcome


def interval_sliding_window(data, windowsize, train=0.8, models=None, partitioners=[Grid.GridPartitioner],
                            partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,
                            save=False, file=None, sintetic=False):
    """
    Parallel sliding window benchmarks for FTS interval forecasters

    For every window yielded by Util.sliding_window, and for every combination
    of partition count and partitioner, each candidate model is trained and
    evaluated by run_interval inside a joblib Parallel call that uses one job
    per CPU core. The per-model metrics of all windows are accumulated and
    handed to Util.save_dataframe_interval.

    :param data: data forwarded to Util.sliding_window
    :param windowsize: size of sliding window
    :param train: percentual of sliding window data used to train the models
    :param models: FTS interval forecaster constructors, each called as model("");
                   when None, benchmarks.get_interval_methods() is used
    :param partitioners: Universe of Discourse partitioner constructors
    :param partitions: the numbers of partitions of the Universe of Discourse to test
    :param max_order: the max order of the models (for high order models)
    :param transformation: data transformation
    :param indexer: seasonal indexer (accepted but not forwarded to the workers)
    :param dump: if true, print the identifier of each window
    :param save: save results
    :param file: file path to save the results
    :param sintetic: if true only the average and standard deviation of the results
    :return: the value returned by Util.save_dataframe_interval
    """
    # NOTE: the list defaults in the signature are shared between calls; they
    # are only iterated here, never mutated.
    _process_start = time.time()

    print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))

    num_cores = multiprocessing.cpu_count()

    # Honour an explicit model list; fall back to the library's interval methods.
    if models is None:
        models = benchmarks.get_interval_methods()

    # One pool entry per (model, order) combination to be benchmarked.
    pool = []
    for model in models:
        mfts = model("")

        if mfts.is_high_order:
            for order in np.arange(1, max_order + 1):
                if order >= mfts.min_order:
                    mfts = model("")
                    mfts.order = order
                    pool.append(mfts)
        else:
            pool.append(mfts)

    objs = {}
    sharpness = {}
    resolution = {}
    coverage = {}
    times = {}

    experiments = 0
    # Distinct loop names keep the `train` ratio argument from being shadowed.
    for ct, train_data, test_data in Util.sliding_window(data, windowsize, train):
        experiments += 1

        if dump:
            print('\nWindow: {0}\n'.format(ct))

        for partition in partitions:

            for partitioner in partitioners:

                data_train_fs = partitioner(train_data, partition, transformation=transformation)

                results = Parallel(n_jobs=num_cores)(
                    delayed(run_interval)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train_data),
                                          deepcopy(test_data), transformation)
                    for m in pool)

                for tmp in results:
                    key = tmp['key']
                    # Keep the first trained object seen for each configuration.
                    if key not in objs:
                        objs[key] = tmp['obj']
                    sharpness.setdefault(key, []).append(tmp['sharpness'])
                    resolution.setdefault(key, []).append(tmp['resolution'])
                    coverage.setdefault(key, []).append(tmp['coverage'])
                    times.setdefault(key, []).append(tmp['time'])

    _process_end = time.time()

    print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))

    print("Process Duration: {0}".format(_process_end - _process_start))

    # NOTE(review): `Util` is rebound by the second import at the top of the
    # file, so this resolves to pyFTS.common.Util - confirm that
    # save_dataframe_interval is defined there and not in pyFTS.benchmarks.Util.
    return Util.save_dataframe_interval(coverage, experiments, file, objs, resolution, save, sharpness, sintetic, times)


def run_ahead(mfts, partitioner, train_data, test_data, steps, resolution, transformation=None, indexer=None):
    """
    Train one FTS model and measure its probabilistic m-step ahead forecasts

    Worker function dispatched through joblib by ahead_sliding_window. Any
    exception raised while training or measuring is printed and reported as
    NaN values instead of being propagated to the caller.

    :param mfts: FTS model; its partitioner attribute is assigned here and the
                 transformation (if any) is appended to it
    :param partitioner: already built Universe of Discourse partitioner (its
                        sets and partitions attributes are read)
    :param train_data: data used to train the model
    :param test_data: data used to test the model
    :param steps: forwarded as steps to benchmarks.get_distribution_statistics
    :param resolution: forwarded as resolution to benchmarks.get_distribution_statistics
    :param transformation: data transformation, appended to the model when not None
    :param indexer: seasonal indexer (accepted but not used by this function)
    :return: a dictionary with the keys 'key', 'obj', 'CRPS_Interval',
             'CRPS_Distribution', 'TIME_Interval' and 'TIME_Distribution'
    """
    # The last component of the partitioner's module path identifies it in the label.
    partitioner_name = str(partitioner.__module__).rsplit('.', 1)[-1]
    label = " ".join([mfts.shortname, "n =", str(mfts.order),
                      partitioner_name, "q =", str(partitioner.partitions)])

    mfts.partitioner = partitioner
    if transformation is not None:
        mfts.appendTransformation(transformation)

    try:
        tic = time.time()
        mfts.train(train_data, partitioner.sets, order=mfts.order)
        training_time = time.time() - tic

        crps_interval, crps_distr, time_interval, time_distr = benchmarks.get_distribution_statistics(
            test_data, mfts, steps=steps, resolution=resolution)
        # Both reported timings include the shared training time.
        time_interval += training_time
        time_distr += training_time
    except Exception as ex:
        # Best effort: a failing model must not abort the whole benchmark run.
        print(ex)
        crps_interval = crps_distr = time_interval = time_distr = np.nan

    outcome = {
        'key': label,
        'obj': mfts,
        'CRPS_Interval': crps_interval,
        'CRPS_Distribution': crps_distr,
        'TIME_Interval': time_interval,
        'TIME_Distribution': time_distr,
    }

    print(outcome)

    return outcome


def ahead_sliding_window(data, windowsize, train, steps, resolution, models=None, partitioners=[Grid.GridPartitioner],
                         partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,
                         save=False, file=None, sintetic=False):
    """
    Parallel sliding window benchmarks for FTS probabilistic forecasters

    For every window yielded by Util.sliding_window, and for every combination
    of partition count and partitioner, each candidate model is trained and
    evaluated by run_ahead inside a joblib Parallel call that uses one job per
    CPU core. The per-model metrics of all windows are accumulated and handed
    to Util.save_dataframe_ahead.

    :param data: data forwarded to Util.sliding_window
    :param windowsize: size of sliding window
    :param train: percentual of sliding window data used to train the models
    :param steps: forwarded to run_ahead
    :param resolution: forwarded to run_ahead
    :param models: FTS forecaster constructors, each called as model("");
                   when None, benchmarks.get_interval_methods() is used
    :param partitioners: Universe of Discourse partitioner constructors
    :param partitions: the numbers of partitions of the Universe of Discourse to test
    :param max_order: the max order of the models (for high order models)
    :param transformation: data transformation
    :param indexer: seasonal indexer (accepted but not forwarded to the workers)
    :param dump: if true, print the identifier of each window
    :param save: save results
    :param file: file path to save the results
    :param sintetic: if true only the average and standard deviation of the results
    :return: the value returned by Util.save_dataframe_ahead
    """
    # NOTE: the list defaults in the signature are shared between calls; they
    # are only iterated here, never mutated.
    _process_start = time.time()

    print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))

    num_cores = multiprocessing.cpu_count()

    # Honour an explicit model list; otherwise use the default pool.
    # NOTE(review): the default pool comes from get_interval_methods(), the same
    # source interval_sliding_window uses - confirm it is the intended one for
    # probabilistic forecasters.
    if models is None:
        models = benchmarks.get_interval_methods()

    # One pool entry per (model, order) combination to be benchmarked.
    pool = []
    for model in models:
        mfts = model("")

        if mfts.is_high_order:
            for order in np.arange(1, max_order + 1):
                if order >= mfts.min_order:
                    mfts = model("")
                    mfts.order = order
                    pool.append(mfts)
        else:
            pool.append(mfts)

    objs = {}
    crps_interval = {}
    crps_distr = {}
    times1 = {}
    times2 = {}

    experiments = 0
    # Distinct loop names keep the `train` ratio argument from being shadowed.
    for ct, train_data, test_data in Util.sliding_window(data, windowsize, train):
        experiments += 1

        if dump:
            print('\nWindow: {0}\n'.format(ct))

        for partition in partitions:

            for partitioner in partitioners:

                data_train_fs = partitioner(train_data, partition, transformation=transformation)

                results = Parallel(n_jobs=num_cores)(
                    delayed(run_ahead)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train_data),
                                       deepcopy(test_data), steps, resolution, transformation)
                    for m in pool)

                for tmp in results:
                    key = tmp['key']
                    # Keep the first trained object seen for each configuration.
                    if key not in objs:
                        objs[key] = tmp['obj']
                    crps_interval.setdefault(key, []).append(tmp['CRPS_Interval'])
                    crps_distr.setdefault(key, []).append(tmp['CRPS_Distribution'])
                    times1.setdefault(key, []).append(tmp['TIME_Interval'])
                    times2.setdefault(key, []).append(tmp['TIME_Distribution'])

    _process_end = time.time()

    print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))

    print("Process Duration: {0}".format(_process_end - _process_start))

    # NOTE(review): `Util` is rebound by the second import at the top of the
    # file, so this resolves to pyFTS.common.Util - confirm that
    # save_dataframe_ahead is defined there and not in pyFTS.benchmarks.Util.
    return Util.save_dataframe_ahead(experiments, file, objs, crps_interval, crps_distr, times1, times2, save, sintetic)
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`"""`
			`joblib Parallelized Benchmarks to FTS methods`
			`"""`

- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`import datetime`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00			`import multiprocessing`
- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`import time`
			`from copy import deepcopy`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`import numpy as np`
- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`from joblib import Parallel, delayed`

			`from pyFTS.benchmarks import benchmarks, Util`
			`from pyFTS.common import Util`
			`from pyFTS.partitioners import Grid`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`def run_point(mfts, partitioner, train_data, test_data, transformation=None, indexer=None):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
			`Point forecast benchmark function to be executed on threads`
			`:param mfts: FTS model`
			`:param partitioner: Universe of Discourse partitioner`
			`:param train_data: data used to train the model`
			`:param test_data: ata used to test the model`
			`:param window_key: id of the sliding window`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:return: a dictionary with the benchmark results`
			`"""`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`pttr = str(partitioner.__module__).split('.')[-1]`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_key = mfts.shortname + " n = " + str(mfts.order) + " " + pttr + " q = " + str(partitioner.partitions)`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`mfts.partitioner = partitioner`
			`if transformation is not None:`
			`mfts.appendTransformation(transformation)`

			`try:`
			`_start = time.time()`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`mfts.train(train_data, partitioner.sets, order=mfts.order)`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`_end = time.time()`
			`times = _end - _start`

			`_start = time.time()`
			`_rmse, _smape, _u = benchmarks.get_point_statistics(test_data, mfts, indexer)`
			`_end = time.time()`
			`times += _end - _start`
			`except Exception as e:`
			`print(e)`
			`_rmse = np.nan`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_smape = np.nan`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`_u = np.nan`
			`times = np.nan`

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`ret = {'key': _key, 'obj': mfts, 'rmse': _rmse, 'smape': _smape, 'u': _u, 'time': times}`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00
			`print(ret)`

			`return ret`


- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`def point_sliding_window(data, windowsize, train=0.8, models=None, partitioners=[Grid.GridPartitioner],`
			`partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,`
			`save=False, file=None, sintetic=False):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
			`Parallel sliding window benchmarks for FTS point forecasters`
			`:param data:`
			`:param windowsize: size of sliding window`
			`:param train: percentual of sliding window data used to train the models`
			`:param models: FTS point forecasters`
			`:param partitioners: Universe of Discourse partitioner`
			`:param partitions: the max number of partitions on the Universe of Discourse`
			`:param max_order: the max order of the models (for high order models)`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:param dump:`
			`:param save: save results`
			`:param file: file path to save the results`
			`:param sintetic: if true only the average and standard deviation of the results`
			`:return: DataFrame with the results`
			`"""`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_process_start = time.time()`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00
			`num_cores = multiprocessing.cpu_count()`

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`pool = []`

Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`objs = {}`
			`rmse = {}`
			`smape = {}`
			`u = {}`
			`times = {}`

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`for model in benchmarks.get_point_methods():`
			`mfts = model("")`

- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if mfts.is_high_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`for order in np.arange(1, max_order + 1):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if order >= mfts.min_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`mfts = model("")`
			`mfts.order = order`
			`pool.append(mfts)`
			`else:`
			`pool.append(mfts)`

			`experiments = 0`
			`for ct, train, test in Util.sliding_window(data, windowsize, train):`
			`experiments += 1`

			`if dump: print('\nWindow: {0}\n'.format(ct))`

Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`for partition in partitions:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`for partitioner in partitioners:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00			`data_train_fs = partitioner(train, partition, transformation=transformation)`

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`results = Parallel(n_jobs=num_cores)(`
			`delayed(run_point)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train), deepcopy(test),`
			`transformation)`
			`for m in pool)`
Parallel benchmarks - sliding window por point forecasts 2017-04-01 19:19:37 +04:00
			`for tmp in results:`
			`if tmp['key'] not in objs:`
			`objs[tmp['key']] = tmp['obj']`
			`rmse[tmp['key']] = []`
			`smape[tmp['key']] = []`
			`u[tmp['key']] = []`
			`times[tmp['key']] = []`
			`rmse[tmp['key']].append(tmp['rmse'])`
			`smape[tmp['key']].append(tmp['smape'])`
			`u[tmp['key']].append(tmp['u'])`
			`times[tmp['key']].append(tmp['time'])`

- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_process_end = time.time()`

			`print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))`

			`print("Process Duration: {0}".format(_process_end - _process_start))`

- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`return Util.save_dataframe_point(experiments, file, objs, rmse, save, sintetic, smape, times, u)`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00

			`def run_interval(mfts, partitioner, train_data, test_data, transformation=None, indexer=None):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
			`Interval forecast benchmark function to be executed on threads`
			`:param mfts: FTS model`
			`:param partitioner: Universe of Discourse partitioner`
			`:param train_data: data used to train the model`
			`:param test_data: ata used to test the model`
			`:param window_key: id of the sliding window`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:return: a dictionary with the benchmark results`
			`"""`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`pttr = str(partitioner.__module__).split('.')[-1]`
			`_key = mfts.shortname + " n = " + str(mfts.order) + " " + pttr + " q = " + str(partitioner.partitions)`
			`mfts.partitioner = partitioner`
			`if transformation is not None:`
			`mfts.appendTransformation(transformation)`

			`try:`
			`_start = time.time()`
			`mfts.train(train_data, partitioner.sets, order=mfts.order)`
			`_end = time.time()`
			`times = _end - _start`

			`_start = time.time()`
			`_sharp, _res, _cov = benchmarks.get_interval_statistics(test_data, mfts)`
			`_end = time.time()`
			`times += _end - _start`
			`except Exception as e:`
			`print(e)`
			`_sharp = np.nan`
			`_res = np.nan`
			`_cov = np.nan`
			`times = np.nan`

			`ret = {'key': _key, 'obj': mfts, 'sharpness': _sharp, 'resolution': _res, 'coverage': _cov, 'time': times}`

			`print(ret)`

			`return ret`


			`def interval_sliding_window(data, windowsize, train=0.8, models=None, partitioners=[Grid.GridPartitioner],`
			`partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,`
			`save=False, file=None, sintetic=False):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
- Implementation of interval and distribution m-step ahead forecasts for arima and quantreg 2017-05-15 21:06:26 +04:00			`Parallel sliding window benchmarks for FTS point_to_interval forecasters`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`:param data:`
			`:param windowsize: size of sliding window`
			`:param train: percentual of sliding window data used to train the models`
			`:param models: FTS point forecasters`
			`:param partitioners: Universe of Discourse partitioner`
			`:param partitions: the max number of partitions on the Universe of Discourse`
			`:param max_order: the max order of the models (for high order models)`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:param dump:`
			`:param save: save results`
			`:param file: file path to save the results`
			`:param sintetic: if true only the average and standard deviation of the results`
			`:return: DataFrame with the results`
			`"""`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_process_start = time.time()`

			`print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))`

			`num_cores = multiprocessing.cpu_count()`

			`pool = []`

			`objs = {}`
			`sharpness = {}`
			`resolution = {}`
			`coverage = {}`
			`times = {}`

			`for model in benchmarks.get_interval_methods():`
			`mfts = model("")`

- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if mfts.is_high_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`for order in np.arange(1, max_order + 1):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if order >= mfts.min_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`mfts = model("")`
			`mfts.order = order`
			`pool.append(mfts)`
			`else:`
			`pool.append(mfts)`

			`experiments = 0`
			`for ct, train, test in Util.sliding_window(data, windowsize, train):`
			`experiments += 1`

			`if dump: print('\nWindow: {0}\n'.format(ct))`

			`for partition in partitions:`

			`for partitioner in partitioners:`

			`data_train_fs = partitioner(train, partition, transformation=transformation)`

			`results = Parallel(n_jobs=num_cores)(`
			`delayed(run_interval)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train), deepcopy(test),`
			`transformation)`
			`for m in pool)`

			`for tmp in results:`
			`if tmp['key'] not in objs:`
			`objs[tmp['key']] = tmp['obj']`
			`sharpness[tmp['key']] = []`
			`resolution[tmp['key']] = []`
			`coverage[tmp['key']] = []`
			`times[tmp['key']] = []`

			`sharpness[tmp['key']].append(tmp['sharpness'])`
			`resolution[tmp['key']].append(tmp['resolution'])`
			`coverage[tmp['key']].append(tmp['coverage'])`
			`times[tmp['key']].append(tmp['time'])`

			`_process_end = time.time()`

			`print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))`

			`print("Process Duration: {0}".format(_process_end - _process_start))`

- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`return Util.save_dataframe_interval(coverage, experiments, file, objs, resolution, save, sharpness, sintetic, times)`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00

			`def run_ahead(mfts, partitioner, train_data, test_data, steps, resolution, transformation=None, indexer=None):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
			`Probabilistic m-step ahead forecast benchmark function to be executed on threads`
			`:param mfts: FTS model`
			`:param partitioner: Universe of Discourse partitioner`
			`:param train_data: data used to train the model`
			`:param test_data: ata used to test the model`
			`:param steps:`
			`:param resolution:`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:return: a dictionary with the benchmark results`
			`"""`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`pttr = str(partitioner.__module__).split('.')[-1]`
			`_key = mfts.shortname + " n = " + str(mfts.order) + " " + pttr + " q = " + str(partitioner.partitions)`
			`mfts.partitioner = partitioner`
			`if transformation is not None:`
			`mfts.appendTransformation(transformation)`

			`try:`
			`_start = time.time()`
			`mfts.train(train_data, partitioner.sets, order=mfts.order)`
			`_end = time.time()`
			`times = _end - _start`

			`_crps1, _crps2, _t1, _t2 = benchmarks.get_distribution_statistics(test_data, mfts, steps=steps,`
			`resolution=resolution)`
			`_t1 += times`
			`_t2 += times`
			`except Exception as e:`
			`print(e)`
			`_crps1 = np.nan`
			`_crps2 = np.nan`
			`_t1 = np.nan`
			`_t2 = np.nan`

			`ret = {'key': _key, 'obj': mfts, 'CRPS_Interval': _crps1, 'CRPS_Distribution': _crps2, 'TIME_Interval': _t1, 'TIME_Distribution': _t2}`

			`print(ret)`

			`return ret`


			`def ahead_sliding_window(data, windowsize, train, steps,resolution, models=None, partitioners=[Grid.GridPartitioner],`
			`partitions=[10], max_order=3, transformation=None, indexer=None, dump=False,`
			`save=False, file=None, sintetic=False):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-07 04:19:04 +04:00			`"""`
			`Parallel sliding window benchmarks for FTS probabilistic forecasters`
			`:param data:`
			`:param windowsize: size of sliding window`
			`:param train: percentual of sliding window data used to train the models`
			`:param steps:`
			`:param resolution:`
			`:param models: FTS point forecasters`
			`:param partitioners: Universe of Discourse partitioner`
			`:param partitions: the max number of partitions on the Universe of Discourse`
			`:param max_order: the max order of the models (for high order models)`
			`:param transformation: data transformation`
			`:param indexer: seasonal indexer`
			`:param dump:`
			`:param save: save results`
			`:param file: file path to save the results`
			`:param sintetic: if true only the average and standard deviation of the results`
			`:return: DataFrame with the results`
			`"""`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_process_start = time.time()`

			`print("Process Start: {0: %H:%M:%S}".format(datetime.datetime.now()))`

			`num_cores = multiprocessing.cpu_count()`

			`pool = []`

			`objs = {}`
			`crps_interval = {}`
			`crps_distr = {}`
			`times1 = {}`
			`times2 = {}`

			`for model in benchmarks.get_interval_methods():`
			`mfts = model("")`

- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if mfts.is_high_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`for order in np.arange(1, max_order + 1):`
- Issue #3 - Code documentation with PEP 257 compliance 2017-05-05 22:01:45 +04:00			`if order >= mfts.min_order:`
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`mfts = model("")`
			`mfts.order = order`
			`pool.append(mfts)`
			`else:`
			`pool.append(mfts)`

			`experiments = 0`
			`for ct, train, test in Util.sliding_window(data, windowsize, train):`
			`experiments += 1`

			`if dump: print('\nWindow: {0}\n'.format(ct))`

			`for partition in partitions:`

			`for partitioner in partitioners:`

			`data_train_fs = partitioner(train, partition, transformation=transformation)`

			`results = Parallel(n_jobs=num_cores)(`
			`delayed(run_ahead)(deepcopy(m), deepcopy(data_train_fs), deepcopy(train), deepcopy(test),`
			`steps, resolution, transformation)`
			`for m in pool)`

			`for tmp in results:`
			`if tmp['key'] not in objs:`
			`objs[tmp['key']] = tmp['obj']`
			`crps_interval[tmp['key']] = []`
			`crps_distr[tmp['key']] = []`
			`times1[tmp['key']] = []`
			`times2[tmp['key']] = []`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`crps_interval[tmp['key']].append(tmp['CRPS_Interval'])`
			`crps_distr[tmp['key']].append(tmp['CRPS_Distribution'])`
			`times1[tmp['key']].append(tmp['TIME_Interval'])`
			`times2[tmp['key']].append(tmp['TIME_Distribution'])`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`_process_end = time.time()`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`print("Process End: {0: %H:%M:%S}".format(datetime.datetime.now()))`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
- Parallel sliding window benchmarks 2017-04-05 01:39:15 +04:00			`print("Process Duration: {0}".format(_process_end - _process_start))`
- Adding gaussmf and trapmf support on partitioners - Parallel util for partitioners 2017-04-01 03:34:12 +04:00
- Issue #3 - Code documentation with PEP 257 compliance - Benchmarks refactoring and optimizations - Probabilistic package, with Kernel Density Estimation 2017-05-08 20:12:08 +04:00			`return Util.save_dataframe_ahead(experiments, file, objs, crps_interval, crps_distr, times1, times2, save, sintetic)`