Untitled

# -*- coding: utf-8 -*-
"""
Created on Mon Dec 10 20:35:34 2018

@author: Jaymon
"""

import tkinter as tk  # python 3
from tkinter import font  as tkfont  # python 3]
from tkinter import filedialog
from matplotlib.widgets import Slider
from tkinter import *

import pandas as pd
import numpy as np

try:
    import pygraphviz
    from networkx.drawing.nx_agraph import graphviz_layout
except ImportError:
    try:
        import pydot
        from networkx.drawing.nx_pydot import graphviz_layout
    except ImportError:
        raise ImportError("This script needs Graphviz and either "
                          "PyGraphviz or pydot")
import matplotlib
import matplotlib.cm as cm
from matplotlib.colors import Normalize
import networkx as nx

# Import backend of matplotlib
matplotlib.use("TkAgg")
from matplotlib.backends.backend_tkagg import FigureCanvasTkAgg, NavigationToolbar2Tk

from matplotlib.figure import Figure

hierarchyfile = 'profile_semantic_trafo_final_hierarchy.txt'
datafile = 'profile_semantic_trafo_final.txt'
df = pd.read_table(datafile, delim_whitespace=True)


def remove_substring(string, array):
    """
 Input:
     string = string to be removed
     arrays = array of arrays which contain strings
 Output: cleaned array
 """
    i = 0
    while i < len(array):
        array[i] = array[i].replace(string, '')
        i = i + 1
    return array


def range_aggregate(sdf, col, size):
    """
    Aggregated the values in col to bins of the width of size.

    Input
    ----------
    df = Dataframe time value in col
    col = Column with time value
    size = the width of the filter

    Output
    ----------
    Dataframe object
    """
    df = sdf
    times = df[col].unique()
    if size < len(times) / 2 and size > 1:
        aggregated = {}
        i = 0
        time = 0
        while time < len(times):
            if i == 0:
                try:
                    name = str(times[time]) + '-' + str(times[size + time - 1])
                except:
                    name = str(times[time]) + '-' + str(times[-1])
            aggregated[str(times[time])] = name
            i = i + 1
            time = time + 1
            if i == size:
                i = 0
        df[col + '_grouped'] = df[col].apply(str)
        df[col + '_grouped'] = df[col + '_grouped'].map(aggregated)
    else:
        sdf[col] = sdf[col].apply(str)
    return df


def hierarchy_aggregate(sdf, cols, depth, hierarchy_file):
    """
    Turns all of the columns in cols into hierarchy strings trimed to a
    maximum depth.

    Input
    ----------
    df = Dataframe
    cols = Array with column values
    depth = depth of hierarchy

    Output
    ----------
    DataFrame with an aditional col for each col in cols
    """
    df = sdf
    # Import hierarchy names
    hierarchy = open(hierarchy_file)
    filenames = []
    for line in hierarchy:
        line = line.rstrip()
        filenames.append(line)
    hierarchy.close()

    # Clean files
    minval = min([min(df['start']), min(df['target'])])
    i = 0
    while i < minval - 1:
        strlen = 1
        line = filenames[i]
        while string_in_arrays(line[:strlen], filenames):
            strlen = strlen + 1
            if strlen > len(line):
                break
        i = i + 1
    filenames = remove_substring(filenames[i][:strlen - 1], filenames)

    # Transfer strings to lists
    arr = 0
    while arr < len(filenames):
        if not filenames[arr] == []:
            filenames[arr] = filenames[arr].strip('/')
            filenames[arr] = filenames[arr].split('/')
            # Cuts off unrequested detail
            if len(filenames[arr]) > depth:
                filenames[arr] = filenames[arr][:depth]
        arr = arr + 1

    # Adds file lists to dictionary
    index = 0
    names = {}
    number = 0
    numbers = {}
    while index < len(filenames):
        names[index + 1] = filenames[index]
        index = index + 1

    # Creates new columns for the arrays
    for col in cols:
        df[col + '_location'] = df[col].map(names)
        df[col + '_location'] = df[col + '_location'].apply(str)
    return df


def string_in_arrays(string, array):
    """
 Input:
     string = string to be found
     arrays = array of arrays which contain strings
 Output: Bool, string in all the arrays
 """
    for str in array:
        if not string in str:
            return False
    return True


def radialNodeLinkVis(G):
    pos = graphviz_layout(G, prog='twopi', args='')
    plt.figure(figsize=(8, 8))
    nx.draw(G, pos, node_size=20, alpha=0.5, node_color="blue", with_labels=False)
    plt.axis('equal')
    return (plt.show())


class SampleApp(tk.Tk):

    def __init__(self, *args, **kwargs):
        tk.Tk.__init__(self, *args, **kwargs)

        self.title_font = tkfont.Font(family='Helvetica', size=18, weight="bold", slant="italic")

        # the container is where we'll stack a bunch of frames
        # on top of each other, then the one we want visible
        # will be raised above the others
        container = tk.Frame(self)
        container.pack(side="top", fill="both", expand=True)
        container.grid_rowconfigure(0, weight=1)
        container.grid_columnconfigure(0, weight=1)

        self.frames = {}
        for F in (StartPage, PageOne, PageTwo):
            page_name = F.__name__
            frame = F(parent=container, controller=self)
            self.frames[page_name] = frame

            # put all of the pages in the same location;
            # the one on the top of the stacking order
            # will be the one that is visible.
            frame.grid(row=0, column=0, sticky="nsew")

        self.show_frame("StartPage")

    def show_frame(self, page_name):
        '''Show a frame for the given page name'''
        frame = self.frames[page_name]
        frame.tkraise()

    def sel_df(self):
        # Select the txt file of the dataset
        self.path_df = filedialog.askopenfilename(initialdir="/", title
        ="Select file", filetypes
                                                  =(("txt files", "*.txt"),
                                                    ("all files", "*.*")))
        # Create df out of it and store it
        self.df = pd.read_table(self.path_df, delim_whitespace=True)

    def sel_df_hier(self):
        # Select the txt file of the hierarchy dataset.
        self.path_df_hier = filedialog.askopenfilename(initialdir="/", title
        ="Select file", filetypes
                                                       =(("txt files", "*.txt"),
                                                         ("all files", "*.*")))
        # Create df out of it and store it
        self.df_hier = pd.read_table(self.path_df_hier, delim_whitespace=True)


class StartPage(tk.Frame):

    def __init__(self, parent, controller):
        tk.Frame.__init__(self, parent)
        self.controller = controller
        label = tk.Label(self, text="GUI group X", font=controller.title_font)
        label.pack(side="top", fill="x", pady=10)

        button1 = tk.Button(self, text="Import main file",
                            command=lambda: controller.sel_df())
        button2 = tk.Button(self, text="Import hierarchy file",
                            command=lambda: controller.sel_df_hier())
        button3 = tk.Button(self, text="Adjacency matrix and Dynamic Graph",
                            command=lambda: controller.show_frame("PageOne"))
        button4 = tk.Button(self, text="Exercise 7",
                            command=lambda: controller.show_frame("PageTwo"))

        button1.pack()
        button2.pack()
        button3.pack()
        button4.pack()


class PageOne(tk.Frame):

    def __init__(self, parent, controller):
        tk.Frame.__init__(self, parent)
        self.controller = controller
        label = tk.Label(self, text="Adjacency Matrix and Dynamic Graph", font=controller.title_font)
        label.pack(side="top", fill="x", pady=10)
        button = tk.Button(self, text="Go to the start page",
                           command=lambda: controller.show_frame("StartPage"))
        button.pack()

        #Label and entry for min time
        label_min_t = StringVar()
        label_min_t.set("Enter desired value for minimum time:")
        label_min_t_dir = Label(self, textvariable=label_min_t)
        label_min_t_dir.pack(side='left', fill="x", pady=10)

        e_min_t = Entry(self, width=10)
        # Set place holder
        e_min_t.insert(END, "0")
        e_min_t.pack(side='left', fill="x", pady=10)

        label_max_t = StringVar()
        label_max_t.set("Enter desired value for maximum time:")
        label_max_t = Label(self, textvariable=label_min_t)
        label_max_t.pack(side='left', fill="x", pady=10)

        #Label and entry for max time
        e_max_t = Entry(self, width=10)
        # Set place holder
        e_max_t.insert(END, "300")
        e_max_t.pack(side='left', fill="x", pady=10)

        button_update = tk.Button(self, text="Update",
                                  command=lambda: self.update(e_min_t.get(), e_max_t.get(),
                                                              cmapvar.get()))
        button_update.pack(side='left', fill="x", pady=10)

        label_cmap = StringVar()
        label_cmap.set("Select desired colormap:")
        label_cmap = Label(self, textvariable=label_cmap)
        label_cmap.pack(side="top", fill="x", pady=10)

        cmapvar = StringVar()
        cmap_choices = {"YlOrRd", "Blues", "cubehelix_r", "gist_rainbow_r",
                        "gist_stern_r", "plasma", "nipy_spectral_r"}
        cmapvar.set("RdY1Gn")

        cmap_menu = OptionMenu(self, cmapvar, *cmap_choices)
        cmap_menu.pack(side="top")

        self.print_graph(df, 'time', 'start', 'target', hierarchyfile, 1, 5, "cubehelix_r", weight='weight',
                         min_time=1, max_time=300, min_weight=0, max_weight='max')

        # Create canvas
        self.canvas = FigureCanvasTkAgg(self.fig, self)
        self.canvas.draw()
        self.canvas.get_tk_widget().pack(side=tk.TOP, fill=tk.BOTH, expand=True)

        # Add standard-layout
        toolbar = NavigationToolbar2Tk(self.canvas, self)
        toolbar.update()
        self.canvas._tkcanvas.pack(side="top", fill="x", pady=10)

    # Update the graph with user input values.
    def update(self, var_min_t, var_max_t, cmap):
        self.print_graph(df, 'time', 'start', 'target', hierarchyfile, 1, 5, cmap, weight='weight',
                         min_time=int(var_min_t), max_time=int(var_max_t), min_weight=0, max_weight='max', a=self.a,)
        print('processed')
        self.canvas.draw()
        print('drawn')

    def print_graph(self, sdf, time, start, target, hierarchy, width, depth, colormap, weight='weight',
                    min_time='min', max_time='max', min_weight='min', max_weight='max', a=True):
        """
        Prints a dynamic graph visualisation by drawing the static graphs of each
        timeslot ontop of each other. Incorperates a range of filering and
        aggregation tools.

        Input
        ----------
        sdf = DataFrame with dynamic graph data
        time = time column of sdf DataFrame
        start = vertex column of sdf DataFrame where edges start
        target = vertex column of sdf DataFrame where edges end
        hierarchy = file where the hierarchy is stored, linked to values of vertices
        width = width in time steps of the time
        depth = maximum depth of hierarchy values
        weight = weight column of sdf DataFrame, default = 'weight'
        min_time = minimum value of time, default = minimum of sdf[time]
        max_time = maximum value of time, default = maximum of sdf[time]
        min_weight = minimum value of weight, default = minimum of sdf[weight]
        max_weight = maximum value of weight, default = maximum of sdf[weight]
        colormap = chosen colormap


        Output
        ----------
        Returns a Figure object

        """

        # Filter Dataset
        sdf = sdf.copy()
        if min_time == 'min':
            min_list = sdf[time] >= sdf[time].min()
        else:
            min_list = sdf[time] >= min_time
        if max_time == 'max':
            max_list = sdf[time] <= sdf[time].max()
        else:
            max_list = sdf[time] <= max_time
        sdf = sdf[min_list & max_list]

        # recycle the list names
        if min_weight == 'min':
            min_list = sdf[weight] >= sdf[weight].min()
        else:
            min_list = sdf[weight] >= min_weight
        if max_weight == 'max':
            max_list = sdf[weight] <= sdf[weight].max()
        else:
            max_list = sdf[time] <= max_weight
        sdf = sdf[min_list & max_list]

        # Transform Weights
        sdf['weight'] = sdf['weight'].apply(np.log10)
        sdf = sdf[min_list & max_list]

        # Aggregates dataset
        sdf = range_aggregate(sdf, time, width)
        sdf = hierarchy_aggregate(sdf, [start, target], depth, hierarchy)

        # Set aggregated names
        time_agg = time + '_grouped'
        start_agg = start + '_location'
        target_agg = target + '_location'
        headers = sdf.dtypes.index

        # Checks if aggregate columns exist
        if time_agg in headers:
            time = time_agg
        if start_agg in headers and target_agg in headers:
            start = start_agg
            target = target_agg
        print(len(sdf))
        sdf['freq'] = sdf.groupby([time, start, target])['weight'].transform('count')

        print(len(sdf))
        # Setup variables for creating the graph
        times = sdf[time].unique()
        end = {}
        self.fig = Figure(figsize=(12, 8), dpi=100)
        if not a == True:
            a.clear()
            self.a = a
        else:
            self.fig = Figure(figsize=(12, 8), dpi=100)
            self.a = self.fig.add_subplot(111)

        self.a.get_xaxis().set_visible(False)
        self.a.get_yaxis().set_visible(False)
        offset = 5
        i = 0

        # Creates dict for the end location of lines
        while i < len(times):
            try:
                end[times[i]] = times[i + offset]
            except:
                end[times[i]] = 'end+' + str(i + offset - len(times))
            i = i + 1

        norm = Normalize(vmin=sdf['weight'].min(), vmax=sdf['weight'].max())
        cmap = cm.get_cmap(name=colormap)
        m = cm.ScalarMappable(norm=norm, cmap=cmap)

        # Plots every row in the dataframe to the plot
        for index, row in sdf.iterrows():
            x = [row[time], end[row[time]]]
            y = [row[start], row[target]]
            self.a.plot(x, y, alpha=0.3, c=m.to_rgba(row['weight']))


class PageTwo(tk.Frame):

    def __init__(self, parent, controller):
        tk.Frame.__init__(self, parent)
        self.controller = controller
        label = tk.Label(self, text="Exercise 7", font=controller.title_font)
        label.pack(side="top", fill="x", pady=10)
        button = tk.Button(self, text="Go to the start page",
                           command=lambda: controller.show_frame("StartPage"))
        button.pack()


if __name__ == "__main__":
    app = SampleApp()
    app.mainloop()