pandorafms/pandora_console/include/functions_forecast.php

229 lines
6.7 KiB
PHP

<?php
// Pandora FMS - http://pandorafms.com
// ==================================================
// Copyright (c) 2005-2010 Artica Soluciones Tecnologicas
// Please see http://pandorafms.org for full contribution list
// This program is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public License
// as published by the Free Software Foundation; version 2
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
/**
* @package Include
* @subpackage Forecast
*/
/**
* Create a prediction based on module data with least square method (linear regression)
*
* @param int Module id.
* @param int Period of the module data.
* @param int Period of the prediction or false to use it in prediction_date function (see below).
* @param int Maximun value using this function for prediction_date.
* @param int Minimun value using this function for prediction_date.
* @param bool Result data for CSV file exportation.
*
* @return array Void array or prediction of the module data.
*/
function forecast_projection_graph($module_id, $period = 5184000, $prediction_period, $max_value = false, $min_value = false, $csv = false){
global $config;
$module_data=grafico_modulo_sparse ($module_id, $period, 0,
300, 300 , '', null,
false, 0, false,
0, '', 0, 1, false,
true, '', 1, true);
if (empty($module_data)){
return array();
}
// Prevents bad behaviour over image error
else if (!is_array($module_data) and preg_match('/^<img(.)*$/', $module_data)){
return;
}
// Data initialization
$sum_obs = 0;
$sum_xi = 0;
$sum_yi = 0;
$sum_xi_yi = 0;
$sum_xi2 = 0;
$sum_yi2 = 0;
$sum_diff_dates = 0;
$last_timestamp = get_system_time();
$agent_interval = 300;
$cont = 1;
$data = array();
$table->data = array();
// Creates data for calculation
foreach ($module_data as $utimestamp => $row) {
if ($utimestamp == '') { continue; }
$data[0] = '';
$data[1] = $cont;
$data[2] = date('d M Y H:i:s', $utimestamp);
$data[3] = $utimestamp;
$data[4] = $row['sum'];
$data[5] = $utimestamp * $row['sum'];
$data[6] = $utimestamp * $utimestamp;
$data[7] = $row['sum'] * $row['sum'];
if ($cont == 1){
$data[8] = 0;
}else{
$data[8] = $utimestamp - $last_timestamp;
}
$sum_obs = $sum_obs + $cont;
$sum_xi = $sum_xi + $utimestamp;
$sum_yi = $sum_yi + $row['sum'];
$sum_xi_yi = $sum_xi_yi + $data[5];
$sum_xi2 = $sum_xi2 + $data[6];
$sum_yi2 = $sum_yi2 + $data[7];
$sum_diff_dates = $sum_diff_dates + $data[8];
$last_timestamp = $utimestamp;
$cont++;
array_push($table->data, $data);
}
$cont--;
// Calculation over data above:
// 1. Calculation of linear correlation coefficient...
// 1.1 Average for X: Sum(Xi)/Obs
// 1.2 Average for Y: Sum(Yi)/Obs
// 2. Covariance between vars
// 3.1 Standard deviation for X: sqrt((Sum(Xi²)/Obs) - (avg X)²)
// 3.2 Standard deviation for Y: sqrt((Sum(Yi²)/Obs) - (avg Y)²)
// Linear correlation coefficient:
$avg_x = $cont/$sum_xi;
$avg_y = $cont/$sum_yi;
$covariance = $sum_xi_yi/$cont;
$dev_x = sqrt(($sum_xi2/$cont) - ($avg_x*$avg_x));
$dev_y = sqrt(($sum_yi2/$cont) - ($avg_y*$avg_y));
// Prevents division by zero
if ($dev_x != 0 and $dev_y != 0){
$linear_coef = $covariance / ($dev_x * $dev_y);
}
// Agent interval could be zero, 300 is the predefined
($sum_obs == 0)? $agent_interval = 300 : $agent_interval = $sum_diff_dates / $sum_obs;
// Could be a inverse correlation coefficient
// if $linear_coef < 0.0
// if $linear_coef >= -1.0 and $linear_coef <= -0.8999
// Function variables have an inverse linear relathionship!
// else
// Function variables don't have an inverse linear relathionship!
// Could be a direct correlation coefficient
// else
// if ($linear_coef >= 0.8999 and $linear_coef <= 1.0) {
// Function variables have a direct linear relathionship!
// else
// Function variables don't have a direct linear relathionship!
// 2. Calculation of linear regresion...
$b_num = (($cont * $sum_xi_yi) - ($sum_xi * $sum_yi));
$b_den = (($cont * $sum_xi2) - ($sum_xi * $sum_xi));
$b = $b_num / $b_den;
$a_num = ($sum_yi) - ($b * $sum_xi);
$a = $a_num / $cont;
// Data inicialization
$output_data = array();
if ($prediction_period != false){
$limit_timestamp = $last_timestamp + $prediction_period;
}
$current_ts = $last_timestamp;
$in_range = true;
$time_format_2 = '';
$temp_range = $period;
if ($period < $prediction_period)
$temp_range = $prediction_period;
if ($temp_range <= 21600) {
$time_format = 'H:i:s';
}
elseif ($temp_range < 86400) {
$time_format = 'H:i';
}
elseif ($temp_range < 1296000) {
$time_format = 'M d';
$time_format_2 = 'H\h';
}
elseif ($temp_range <= 2592000) {
$time_format = 'M d';
$time_format_2 = 'H\h';
}
else {
$time_format = 'M d';
}
// Aplying linear regression to module data in order to do the prediction
$output_data = array();
$idx = 0;
// Create data in graph format like
while ($in_range){
$timestamp_f = date($time_format, $current_ts);
//$timestamp_f = date($time_format, $current_ts);
$timestamp_f = graph_get_formatted_date($current_ts, $time_format, $time_format_2);
if ($csv){
$output_data[$idx]['date'] = $current_ts;
$output_data[$idx]['data'] = ($a + ($b * $current_ts));
}
else{
$output_data[$timestamp_f] = ($a + ($b * $current_ts));
}
// Using this function for prediction_date
if ($prediction_period == false){
// This statements stop the prediction when interval is greater than 4 years
if ($current_ts - $last_timestamp >= 126144000){
return false;
}
//html_debug_print(" Date " . $timestamp_f . " data: " . $output_data[$timestamp_f]);
// Found it
if ($max_value >= $output_data[$timestamp_f] and $min_value <= $output_data[$timestamp_f]){
return $current_ts;
}
}else if ($current_ts > $limit_timestamp){
$in_range = false;
}
$current_ts = $current_ts + $agent_interval;
$idx++;
}
return $output_data;
}
/**
* Return a date when the date interval is reached
*
* @param int Module id.
* @param int Given data period to make the prediction
* @param int Max value in the interval.
* @param int Min value in the interval.
*
* @return mixed timestamp with the prediction date or false
*/
function forecast_prediction_date ($module_id, $period = 5184000, $max_value = 0, $min_value = 0){
// Checks interval
if ($min_value > $max_value){
return false;
}
return forecast_projection_graph($module_id, $period, false, $max_value, $min_value);
}