plotting.py

# python libraries
import numpy as np
import tensorflow as tf
import pickle
import pandas as pd
import matplotlib.pyplot as plt
import gc
import pprint

#my scripts
import go_parser as gp
import DNN_go_tensorflow as dnn_go
import visualization as vz


COLUMNS = [chr(ord('a') + i) for i in range(19)]
ROWS = [chr(ord('a') + i) for i in range(19)]

def main():
    draw_board_probabilities_10_step()


def patch_size():
    # result = {"x": [], "train": [], "test": [], "time": []}
    # go_data = gp.parse_games(num_games=10000, first_n_moves=10, onehot=True)
    # for size in range(3, 12):
    #     train_accu, test_accu, time, dummy = dnn_go.conv(
    #         go_data, conv_patch_size=size, pooling=True)
    #     result["x"].append(size)
    #     result["train"].append(train_accu[-1])
    #     result["test"].append(test_accu[-1])
    #     result["time"].append(time)
    # pprint.pprint(result)
    # with open("generated_result/patch_size", "w") as f:
    #     f.write(pickle.dumps(result))
    #     f.close()
    accu = {'test': [0.42558536,
                       0.42783415,
                       0.42655641,
                      0.42819193,
                      0.43125847,
                      0.43110517,
                      0.42829415,
                      0.43008298,
                      0.43003187],
             'time': [425.863521,
                      429.166862,
                      460.774318,
                      461.709615,
                      437.670243,
                      440.934634,
                      446.709425,
                      449.771147,
                      445.710461],
             'train': [0.4609375,
                       0.5546875,
                       0.5078125,
                       0.4765625,
                       0.53125,
                       0.59375,
                       0.46875,
                       0.546875,
                       0.53125],
             'x': [3, 4, 5, 6, 7, 8, 9, 10, 11]}


    fig, ax1 = plt.subplots()
    ax1.plot(accu['x'], accu['test'], 'bo-')
    ax1.plot(accu['x'], accu['train'], 'r*-')
    ax1.set_xlabel("conv patch size")
    # Make the y-axis label and tick labels match the line color.
    ax1.set_ylabel('prediction accuracy', color='b')

    plt.title("prediction accuracy influenced by patch size")
    ax1.legend(["test accuracy", "train accuracy"], loc="best")

    axbox = ax1.get_position()

    plt.show()

def pooling_or_not():
    # results = {"pooling": {"train": [], "test": [], "time": 0},
    #            "not pooling": {"train": [], "test": [], "time": 0}}
    # go_data = gp.parse_games(num_games=1000, first_n_moves=10, onehot=True)
    # for pool in ["pooling", "not pooling"]:
    #     (results[pool]["train"], results[pool]["test"],
    #      results[pool]["time"], dummy) = dnn_go.conv(go_data, pooling=pool)
    # print results
    # with open("generated_data/pooling.pkl", "w") as f:
    #     f.write(pickle.dumps(results))
    #     f.close()

    with open("generated_data/pooling.pkl", "r") as f:
        accu = pickle.loads(f.read())
        f.close()

    colors = ["g", "r", "b", "m"]
    i = 0
    for p in ["pooling", "not pooling"]:
        epochs= range(len(accu[p]['test']))

        plt.plot(epochs, accu[p]['test'], colors[i] + 'o-')
        i += 1
        plt.plot(epochs, accu[p]['train'], colors[i] + '*-')
        i += 1
    plt.xlabel("number of epochs")
    plt.title("Pooling or Not Pooling after convolutional layer")
    plt.legend(["test accuracy with pooling", "train accuracy with pooling",
                "test accuracy without pooling", "train accuracy without pooling"], loc='best')

    plt.show()

def dropout_or_not():
    go_data = gp.parse_games(num_games=10000, first_n_moves=10, onehot=True)
    x = [0.0, .2, 0.5, 0.8]
    train_accu = []
    test_accu = []
    time = []
    for rate in x:
        train_accuracy, test_accuracy, training_time, epoch_time = dnn_go.basic_3layer_NN(
            go_data, hidden_layer_num=2000, dropout_rate=rate)
        train_accu.append(train_accuracy)
        test_accu.append(test_accuracy)
        time.append(training_time)
    # with open("generated_data/dropout_or_not.pkl", "w") as f:
    #     f.write(pickle.dumps({"x": x, "train accuracy": train_accu,
    #                           "test accuracy": test_accu, "time": time}))

    # with open("generated_data/dropout_or_not.pkl", "r") as f:
    #     accu = pickle.loads(f.read())
    #
    # fig, ax1 = plt.subplots()
    # ax1.plot(accu['x'], accu['test accuracy'], 'bo-')
    # ax1.plot(accu['x'], accu['train accuracy'], 'g*-')
    # ax1.set_xlabel("dropout rate")
    # # Make the y-axis label and tick labels match the line color.
    # ax1.set_ylabel('prediction accuracy', color='b')
    # for tl in ax1.get_yticklabels():
    #     tl.set_color('b')
    # ax2 = ax1.twinx()
    # ax2.plot(accu['x'], accu['time'], 'ro-')
    # ax2.set_ylabel('training time in sceonds', color='r')
    # for tl in ax2.get_yticklabels():
    #     tl.set_color('r')
    #
    # plt.title("effect of droppout")
    # ax1.legend(["test accuracy", "train accuracy"], loc="center left")
    #
    # axbox = ax1.get_position()
    #
    # ax2.legend(["training time"], loc=(axbox.x0 - 0.1, axbox.y0 + 0.25))
    # plt.show()

def plot_accuracy_scaling_with_training_example():
    # accu = {"train": [], "test": [], "epoch_time": [], "x": [50000, 30000, 10000, 5000, 3000, 1000]}
    # for n in accu["x"]:
    #     go_data = gp.parse_games(num_games=n, first_n_moves=10, onehot=True)
    #     train_accuracy, test_accuracy, dummy, epoch_time = dnn_go.basic_3layer_NN(
    #         go_data, hidden_layer_num=2000)
    #     accu["train"].append(train_accuracy)
    #     accu["test"].append(test_accuracy)
    #     accu["epoch_time"].append(epoch_time)
    #     print n
    #     print train_accuracy
    #     print test_accuracy
    #     print epoch_time, "seconds"
    #     gc.collect()
    # print accu
    # with open("generated_data/first_10/sample_size_accuracy.pkl", "w") as f:
    #     f.write(pickle.dumps(accu))
    #     f.close()

    with open("generated_data/first_10/sample_size_accuracy.pkl", "r") as f:
        accu = pickle.loads(f.read())
        f.close()
    print accu

    fig, ax1 = plt.subplots()
    ax1.plot(accu['x'], accu['test'], 'bo-')
    ax1.plot(accu['x'], accu['train'], 'b*-')
    ax1.set_xlabel("number of games as training data")
    # Make the y-axis label and tick labels match the line color.
    ax1.set_ylabel('prediction accuracy', color='b')
    for tl in ax1.get_yticklabels():
        tl.set_color('b')
    ax2 = ax1.twinx()
    ax2.plot(accu['x'], accu['epoch_time'], 'ro-')
    ax2.set_ylabel('epoch time in sceonds', color='r')
    for tl in ax2.get_yticklabels():
        tl.set_color('r')

    plt.title("accurayc scaling with more training data")
    ax1.legend(["test accuracy", "train accuracy"], loc="lower center")
    ax2.legend(["epoch time"], loc="lower right")
    plt.show()

def plot_hidden_node_and_accuracy():
    accu = {"train": [], "test": []}
    go_data = gp.parse_games(num_games=10000, first_n_moves=10, onehot=True)
    for hidden_nodes in range(100, 1100, 100) + range(1500, 6500, 500):
        train_accuracy, test_accuracy = dnn_go.basic_3layer_NN(go_data, hidden_layer_num=hidden_nodes)
        accu["train"].append(train_accuracy)
        accu["test"].append(test_accuracy)
        print hidden_nodes
        print train_accuracy
        print test_accuracy
    print accu
    with open("generated_data/first_10/hidden_nodes_accuracy.pkl", "w") as f:
        f.write(pickle.dumps(accu))

    with open("generated_data/first_10/hidden_nodes_accuracy.pkl", "r") as f:
        accuracies = pickle.loads(f.read())
        f.close()

    x = range(100, 1100, 100) + range(1500, 6500, 500)

    plt.plot(x, accuracies["train"], "r")
    plt.plot(x, accuracies["test"], "g")
    legend=["train accuracy", "test accuracy"]
    plt.xlabel("number hidden nodes")
    plt.ylabel("accuracy")
    plt.title("prediction accuracy with different number of hidden nodes")
    plt.legend(legend, loc="best")
    plt.show()

def get_prediction_example():
    prob, board, move = gp.basic_3layer_NN(
        num_games=1000, first_n=10, epoch=20, move_only=True)
    print board
    print move
    print prob

    with open("generated_data/first_10/probability_10_step", "w") as f:
        f.write(pickle.dumps([prob, board, move]))
        f.close()


def draw_board_probabilities_10_step():
    with open("/Users/Molly/Desktop/CMPS218 Deep Learning/AlphaGoPolicyNet/generated_data/probs_first_10.pkl", "r") as f:
        result = pickle.loads(f.read())
        probs, boards, moves = result['probs'], result['boards'], result['moves']
        f.close()

    i = 2
    board = np.array(boards[i]).reshape((19, 19))
    move = np.array(moves[i]).reshape((19, 19))
    prob = np.array(probs[i]).reshape((19, 19))

    board = (board * 2).astype(int)

    vz.draw_board(board, move, prob)


def plot_accuracy_decay_over_moves():
    # test_accu = {1000: [], 5000: [], 20000: []}
    # for n in [1000, 5000, 20000]:
    #     for move in range(1, 21):
    #         go_data = gp.parse_games(num_games=n, first_n_moves=move, onehot=True)
    #         dummy1, test_accuracy, dummy2 = dnn_go.basic_3layer_NN(
    #             go_data, verbose=False, hidden_layer_num=2000)
    #         test_accu[n].append(test_accuracy)
    #         print "num games = %d, moves = %d, accuracy=%f" %(n, move, test_accuracy)
    # with open("generated_data/accuracy_decay", "w") as f:
    #     f.write(pickle.dumps(test_accu))

    with open("generated_data/accuracy_decay", "r") as f:
        result = pickle.loads(f.read())
        f.close()
    legend = []
    for num_game, accuracies in result.iteritems():
        plt.plot(range(1, 21), accuracies)
        legend.append(str(num_game) + " training games")

    plt.xlabel("number of moves")
    plt.ylabel("prediction accuracy")
    plt.title("decreasing prediction accuracy with increasing board complexity")
    plt.legend(legend, loc="bestdfd")
    plt.show()


def draw_board_probabilities():
    with open("probabilitiy_of_open_game", "r") as f:
        probs = pickle.loads(f.read())
        f.close()

    open_moves =gp.map_1d_to_2d(get_open_move())
    vz.draw_openning_board([], probs['All'])

def get_open_move():
    go_data = gp.parse_games(num_games=100, first_n_moves=1)
    open_moves = go_data.train.labels
    for i in [60, 72, 288, 300]:
        print i, len(open_moves[open_moves == i])
    return open_moves

if __name__ == '__main__':
    main()