# pywatts/pywatts/routines.py
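"""Helper routines for training, evaluating and querying the pywatts model.

The `nn` argument used throughout is assumed to be the pywatts
neural-network wrapper, i.e. an object exposing `train`, `evaluate`
and `predict1h`; this module only calls those three methods.
"""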

import matplotlib.pyplot as pp
import numpy as np
from sklearn.metrics import explained_variance_score, mean_absolute_error, median_absolute_error
import pandas
from random import randint


def train_split(data, size):
    """Draw up to `size` random 336-value 'dc' windows from `data`.

    Returns two DataFrames: the concatenated input windows and, for each
    window, the single target value at offset 337 from the window start.
    Duplicate start indices are skipped, so fewer than `size` samples may
    be returned.
    """
    used_idxs = []
    X_values = {'dc': []}
    y_values = []
    for i in range(size):
        # Highest start index that still leaves room for the 336 input
        # values and the target at offset 337.
        rnd_idx = randint(0, data.shape[0] - 338)
        if rnd_idx in used_idxs:
            continue
        else:
            used_idxs.append(rnd_idx)
        X_values['dc'].extend(data['dc'][rnd_idx:rnd_idx + 336].tolist())
        y_values.append(data['dc'][rnd_idx + 337].tolist())
    return pandas.DataFrame.from_dict(X_values), pandas.DataFrame.from_dict({'dc': y_values})
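
# input_query(), input_queries() and input_result() below turn JSON payloads
# into the DataFrames the model expects. A sketch of the assumed payload
# shape (not verified against the pywatts server): a JSON table whose 'dc'
# cells are lists of hourly values, e.g.
#   '[{"dc": [0.0, 1.2, ...]}, {"dc": [0.3, 0.9, ...]}]'
# input_queries() also reports, as `oneH`, whether the payload lacks a
# 'max_temp' column.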
def input_query(json_str, idx=0):
    """Build a single query DataFrame from record `idx` of a JSON payload."""
    tmp_df = pandas.read_json(json_str)
    return pandas.DataFrame.from_dict(
        {'dc': tmp_df['dc'][idx]}
    )


def input_queries(json_str):
    """Build one query DataFrame per record of a JSON payload.

    Returns (oneH, queries); oneH is True when the payload has no
    'max_temp' column.
    """
    tmp_df = pandas.read_json(json_str)

    oneH = False
    try:
        # Probe for the optional 'max_temp' column; a KeyError means it
        # is missing from the payload.
        tmp_df['max_temp'][0]
    except KeyError:
        oneH = True

    queries = []
    for i in range(len(tmp_df)):
        queries.append(pandas.DataFrame.from_dict(
            {'dc': tmp_df['dc'][i]}
        ))
    return oneH, queries
def input_result(json_str, idx=0):
    """Return the raw value row at position `idx` of a JSON result payload."""
    tmp_df = pandas.read_json(json_str)
    return tmp_df.values[idx]


def train(nn, X_train, y_train, X_val, y_val, steps=100):
    """Run `steps` training rounds, evaluating on the validation set after each.

    Returns the list of evaluation results.
    """
    evaluation = []
    for i in range(steps):
        # batch_size: the number of 336-value windows in the training set.
        nn.train(X_train, y_train, batch_size=len(X_train['dc']) // 336, steps=100)
        evaluation.append(nn.evaluate(X_val, y_val))
        print("Training %s of %s" % ((i + 1), steps))
    return evaluation
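
# Typical use of train()/plot_training() (sketch; `nn` is the model wrapper
# assumed above, and X_train/y_train/X_val/y_val come from train_split()):
#   evaluation = train(nn, X_train, y_train, X_val, y_val, steps=10)
#   plot_training(evaluation)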
def plot_training(evaluation):
    """Plot loss against global step for the evaluation results of train()."""
    loss = []
    steps = []
    for e in evaluation:
        loss.append(e['loss'])
        steps.append(e['global_step'])

    pp.plot(steps, loss)
    # Needed for execution in PyCharm
    pp.show()


def predict(nn, X_pred):
    """Run the 1-hour prediction for X_pred and cap negative outputs at 0."""
    pred = nn.predict1h(X_pred)
    # Cap results to 0
    predictions = np.array([max(p['predictions'], [0]) for p in pred])
    return predictions


def predict24h(nn, X_pred):
    """Predict 24 hours ahead, one hour at a time.

    After each 1-hour prediction the 336-value 'dc' window is shifted by
    one value and the prediction is appended, so later hours are predicted
    from earlier predictions.
    """
    predictions = []
    window = {'dc': X_pred['dc'].tolist()}
    for i in range(24):
        pred = nn.predict1h(pandas.DataFrame.from_dict(window))
        # Cap prediction to 0
        predictions.extend([max(p['predictions'][0], 0) for p in pred])
        # Remove the first value and append the predicted value
        del window['dc'][0]
        window['dc'].append(predictions[-1])
        # print("Prediction for hour %d/%d" % (i + 1, 24))
    return predictions
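
# Example use of predict24h() (sketch; `json_str` and `nn` are assumed inputs):
#   query = input_query(json_str)
#   forecast = predict24h(nn, query)
#   print(jsonify(forecast))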
def eval_prediction(prediction, result):
    print("The Explained Variance: %.2f" % explained_variance_score(
        result, prediction))
    print("The Mean Absolute Error: %.2f volt dc" % mean_absolute_error(
        result, prediction))
    print("The Median Absolute Error: %.2f volt dc" % median_absolute_error(
        result, prediction))
def jsonify(predictions):
    json_out = "["
    for v in predictions:
        json_out += "[" + str(v) + "],"
    json_out = json_out[:-1] + "]"
    return json_out
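
# End-to-end sketch of how these routines fit together. Data loading and
# model construction live elsewhere in pywatts, so `df` (a DataFrame with an
# hourly 'dc' column), `nn` (the model wrapper), `query_json` and
# `result_json` are assumptions, not this module's API:
#   X_train, y_train = train_split(df, 1000)
#   X_val, y_val = train_split(df, 200)
#   plot_training(train(nn, X_train, y_train, X_val, y_val, steps=10))
#   forecast = predict24h(nn, input_query(query_json))
#   eval_prediction(forecast, input_result(result_json))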