# Source code for rivus.io.db

import warnings
from datetime import datetime
from pandas import Series, DataFrame, read_sql
from geopandas import GeoDataFrame
from shapely.wkt import loads as wkt_load
import json
from ..main.rivus import get_timeseries, get_constants


def init_run(engine, runner='Havasi', start_ts=None, status='prepared',
             outcome='not_run', comment=None, plot_dict=None, profiler=None):
    """Insert a new row into the `run` table and return its `run_id`.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    runner : str, optional
        Name/identifier of the person who created (executed) the run.
    start_ts : datetime.datetime, optional
        Timezone-less datetime object.
        If omitted, ``datetime.now()`` is used.
    status : str, optional
        One of the following strings:
        | 'prepared' (default) | 'run' | 'error'
    outcome : str, optional
        One of the following strings:
        | 'not_run'  (default) | 'optimum' | 'optimum_not_found' | 'error'
    comment : str, optional
        Any text based comment.
    plot_dict : dict, optional
        Dictionary returned by the rivus.io.plot.fig3d function.
        It is stored JSON-encoded (``json.dumps``).
    profiler : pandas.Series, optional
        Series containing profiled process name and execution time pairs.
        Execution time is measured in *seconds*.
        It is stored JSON-encoded (``Series.to_json``).

    Returns
    -------
    int
        run_id of the initialized run row in the DB.
    """
    if start_ts is None:
        start_ts = datetime.now()

    # Both optional payloads are serialized to JSON text; None stays NULL.
    profiler_json = profiler.to_json() if profiler is not None else None
    plot_json = json.dumps(plot_dict) if plot_dict is not None else None

    connection = engine.raw_connection()
    try:
        with connection.cursor() as curs:
            curs.execute("""
                INSERT INTO run (runner, start_ts, status, outcome, comment,
                                 plot, profiler)
                VALUES (%s, %s, %s, %s, %s, %s, %s)
                RETURNING run_id;
                """, (runner, start_ts, status, outcome, comment, plot_json,
                      profiler_json))
            run_id = curs.fetchone()[0]
        connection.commit()
    finally:
        # Always hand the raw connection back, even if the insert failed.
        connection.close()
    return run_id


def _purge_table(engine, table, run_id):
    """Delete rows in `table` which are related to `run_id`.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    table : str
        An existing table in database 'rivus_db'
        See: [rivus_db](https://github.com/lnksz/rivus_db)
        Unrecognized names only trigger a warning; nothing is deleted.
    run_id : int
        run_id of the initialized run row in the DB.
        Used to identify related data to be removed:
        directly (table has `run_id` as FK) and
        indirectly (table has FK of an Entity with `run_id` FK)

    Returns
    -------
    None
    """
    # Tables that carry `run_id` themselves.
    direct = ('process', 'commodity', 'edge', 'vertex', 'area', 'time',
              'cost')
    # Tables tied to a run only through a parent entity, grouped by that
    # parent. The linking column is always `<parent>_id`.
    by_parent = {
        'commodity': ('process_commodity', 'vertex_source', 'area_demand',
                      'time_demand', 'pmax', 'flow', 'source'),
        'edge': ('edge_demand', 'time_hub', 'kappa_hub'),
        'vertex': ('kappa_process',),
    }

    # Identifiers are formatted into the SQL text, which is safe only because
    # they are restricted to the fixed names listed above.
    if table in direct:
        query = 'DELETE FROM "{0}" WHERE run_id = %s;'.format(table)
    else:
        parent = next((name for name, children in by_parent.items()
                       if table in children), None)
        if parent is None:
            warnings.warn("<{}> is not recognized. "
                          "So it was not purged from database".format(table))
            return
        query = ('DELETE FROM "{0}" USING "{1}" '
                 'WHERE "{0}".{1}_id = "{1}".{1}_id AND "{1}".run_id = %s;'
                 ).format(table, parent)

    connection = engine.raw_connection()
    try:
        with connection.cursor() as curs:
            curs.execute(query, (run_id,))
        connection.commit()
    finally:
        connection.close()


def purge_run(engine, run_id):
    """Delete all rows related to run_id across all tables.

    **This is not a thoroughly reliable function, and can do some harm.
    Use it with caution, and at your own risk!**

    Each table is purged in its own call to `_purge_table`, so the
    operation as a whole is not atomic.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    run_id : int
        run_id of the initialized run row in the DB.
        Used to identify related data to be removed:
        directly (table has `run_id` as FK) and
        indirectly (table has FK of an Entity with `run_id` FK)

    Returns
    -------
    None
    """
    # Table order matters: reverse of `store()` logic, so that rows which
    # reference an entity are removed before the entity itself.
    results = ('source', 'cost', 'pmax', 'kappa_hub', 'kappa_process',
               'time_hub', 'flow')
    second_gen = ('process_commodity', 'vertex_source', 'edge_demand',
                  'area_demand', 'time_demand')
    first_gen = ('edge', 'vertex', 'area', 'time', 'process', 'commodity')
    for table in results + second_gen + first_gen:
        _purge_table(engine, table, run_id)


def _handle_geoframe(engine, frame, df, run_id):
    """Insert the rows of a geo-frame, with `geometry` converted to WKT.

    All rows are inserted in a single transaction: if any row fails,
    nothing from this call is committed.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    frame : str
        Name of the DataFrame as in `prob.params[]`.
        Supported: 'vertex' and 'edge'.
    df : GeoDataFrame
        As retrieved from `prob.params[]`. Needs a `geometry` column whose
        items expose `.wkt`. For 'vertex' the index is the vertex number;
        for 'edge' the index is a (vertex1, vertex2) pair and an `Edge`
        column holds the edge number.
    run_id : int
        run_id of the initialized run row in the DB.

    Returns
    -------
    None

    Raises
    ------
    ValueError
        If `frame` is neither 'vertex' nor 'edge'.
    """
    if frame == 'vertex':
        cols = ['run_id', 'vertex_num', 'geometry']
        vals = '%s, %s, ST_GeogFromText(%s)'
    elif frame == 'edge':
        cols = ['run_id', 'edge_num', 'vertex1', 'vertex2', 'geometry']
        vals = '%s, %s, %s, %s, ST_GeogFromText(%s)'
    else:
        raise ValueError("<{}> is not a supported geo-frame. "
                         "Expected 'vertex' or 'edge'.".format(frame))

    string_query = """
        INSERT INTO {0} ({1})
        VALUES ({2});
        """.format(frame, ','.join(cols), vals)

    connection = engine.raw_connection()
    try:
        with connection.cursor() as curs:
            for key, row in df.iterrows():
                wkt = row['geometry'].wkt
                if frame == 'vertex':
                    params = (run_id, int(key), wkt)
                else:
                    v1, v2 = key
                    # int() keeps the driver away from numpy scalar types.
                    params = (run_id, int(row['Edge']), v1, v2, wkt)
                curs.execute(string_query, params)
        connection.commit()
    finally:
        connection.close()


def _handle_graph(engine, graph_dict, run_id):
    """Store one graph-analysis result in the `graph_analysis` table.

    The commodity name in `graph_dict` is resolved to the `commodity_id`
    belonging to `run_id` by a sub-select in the insert statement.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    graph_dict : dict
        Analysis results. Keys:
        - commodity: String denotation. e.g. 'Elec'
        - is_connected: Boolean.
        - connected_components: Int. Number of connected components.
        - is_minimal: Boolean.
            Is the graph also a minimal spanning tree/forest?
    run_id : int
        run_id of the initialized run row in the DB.
    """
    # Work on a copy so the caller's dict is left untouched.
    params = dict(graph_dict)
    params['run_id'] = run_id

    insert_sql = """
                 INSERT INTO graph_analysis (commodity_id, is_connected,
                                             connected_components, is_minimal)
                 VALUES (
                     (SELECT commodity_id FROM commodity
                      WHERE run_id = %(run_id)s AND
                         commodity LIKE %(commodity)s),
                     %(is_connected)s,
                     %(connected_components)s,
                     %(is_minimal)s);
                 """

    db_conn = engine.raw_connection()
    try:
        with db_conn.cursor() as cursor:
            cursor.execute(insert_sql, params)
        db_conn.commit()
    finally:
        db_conn.close()


def _insert_rows(engine, query, rows):
    """Run `query` once per parameter dict in `rows`, in one transaction.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    query : str
        SQL statement with named (``%(name)s``) placeholders.
    rows : iterable of dict
        One parameter mapping per execution of `query`.

    Returns
    -------
    None
    """
    connection = engine.raw_connection()
    try:
        with connection.cursor() as curs:
            for values in rows:
                curs.execute(query, values)
        # Single commit: nothing is persisted if any row fails.
        connection.commit()
    finally:
        connection.close()


def _fill_table(engine, frame, df, run_id):
    """Insert data to db.table from dataframe.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    frame : str
        Name of the DataFrame from which data will be exported to DB.
        Frames 'flow', 'hub', 'proc_io' and 'proc_tau' are not implemented
        and unknown names are not handled; both only raise a warning.
    df : DataFrame or Series
        Expected is a DataFrame, which is an input or output of the rivus
        ConcreteModel. (create_model(), solve(), ...)
        For 'cost' a Series indexed by 'Inv', 'Fix' and 'Var' is expected.
        `df` itself is never modified.
    run_id : int
        run_id of the initialized run row in the DB.

    Returns
    -------
    None
    """
    col_map = {
        'Edge': 'edge_num',
        'allowed-max': 'allowed_max',
        'cap-max': 'cap_max',
        'cap-min': 'cap_min',
        'cost-fix': 'cost_fix',
        'cost-inv-fix': 'cost_inv_fix',
        'cost-inv-var': 'cost_inv_var',
        'cost-var': 'cost_var',
        'loss-fix': 'loss_fix',
        'loss-var': 'loss_var',
    }
    if frame == 'commodity':
        sql_df = df.rename(columns=col_map)
        sql_df['run_id'] = run_id
        sql_df.to_sql(frame, engine, if_exists='append', index_label=frame)
    elif frame == 'process':
        sql_df = df.loc[:, 'cost-inv-fix':'cap-max'].rename(columns=col_map)
        sql_df['run_id'] = run_id
        sql_df.to_sql(frame, engine, if_exists='append', index_label=frame)
    elif frame == 'edge':
        # Edges first (they get their edge_id), then the per-building demands
        # which reference them.
        _handle_geoframe(engine, frame, df.loc[:, ['Edge', 'geometry']],
                         run_id)
        demands = df.loc[:, [c for c in df.columns.values if c != 'geometry']]
        query = """
            INSERT INTO edge_demand
            (edge_id, area_id, value)
            VALUES (
                (SELECT edge_id FROM edge
                 WHERE run_id = %(run_id)s AND
                       edge_num = %(edge)s),
                (SELECT area_id FROM "area"
                 WHERE run_id = %(run_id)s AND
                       building_type LIKE %(building)s),
                %(demand)s);
            """
        rows = (dict(edge=int(row['Edge']), building=col, demand=int(demand),
                     run_id=run_id)
                for _, row in demands.iterrows()
                for col, demand in row.items()
                if col != 'Edge')
        _insert_rows(engine, query, rows)
    elif frame == 'vertex':
        _handle_geoframe(engine, frame, df.geometry.to_frame(), run_id)
        sources = df.loc[:, [c for c in df.columns.values if c != 'geometry']]
        query = """
            INSERT INTO vertex_source
            (vertex_id, commodity_id, value)
            VALUES (
                (SELECT vertex_id FROM vertex
                 WHERE run_id = %(run_id)s AND
                       vertex_num = %(vertex)s),
                (SELECT commodity_id FROM commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                %(value)s);
            """
        rows = (dict(vertex=int(ver), commodity=comm, value=int(val),
                     run_id=run_id)
                for ver, row in sources.iterrows()
                for comm, val in row.items())
        _insert_rows(engine, query, rows)
    elif frame == 'time':
        sql_df = df.loc[:, 'weight'].to_frame()
        sql_df['run_id'] = run_id
        sql_df.to_sql(frame, engine, if_exists='append',
                      index_label='time_step')
        scales = df.loc[:, [c for c in df.columns.values if c != 'weight']]
        query = """
            INSERT INTO time_demand
            (time_id, commodity_id, scale)
            VALUES (
                (SELECT time_id FROM "time"
                 WHERE run_id = %(run_id)s AND
                       time_step = %(time_step)s),
                (SELECT commodity_id FROM commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                %(value)s);
            """
        rows = (dict(time_step=ts, commodity=comm, value=float(val),
                     run_id=run_id)
                for ts, row in scales.iterrows()
                for comm, val in row.items())
        _insert_rows(engine, query, rows)
    elif frame == 'area_demand':
        # The distinct building types become the rows of the `area` table.
        area_types = df.unstack(level='Commodity').index.values
        sql_df = DataFrame(dict(building_type=area_types,
                                run_id=[run_id] * len(area_types)))
        sql_df.to_sql('area', engine, if_exists='append', index=False)
        query = """
            INSERT INTO area_demand
            (area_id, commodity_id, peak)
            VALUES (
                (SELECT area_id FROM area
                 WHERE run_id = %(run_id)s AND
                       building_type LIKE %(area)s),
                (SELECT commodity_id FROM commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                %(peak)s);
            """
        rows = (dict(row, area=key[0], commodity=key[1], run_id=run_id)
                for key, row in df.iterrows())
        _insert_rows(engine, query, rows)
    elif frame == 'process_commodity':
        query = """
            INSERT INTO process_commodity
            (process_id, commodity_id, direction, ratio)
            VALUES (
                (SELECT process_id FROM process
                 WHERE run_id = %(run_id)s AND
                       process LIKE %(process)s),
                (SELECT commodity_id FROM commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                %(direction)s,
                %(ratio)s);
            """
        rows = (dict(row, process=key[0], commodity=key[1],
                     direction=key[2].lower(), run_id=run_id)
                for key, row in df.iterrows())
        _insert_rows(engine, query, rows)
    elif frame == 'source':
        # Missing values are stored as 0; work on a copy so the caller's
        # frame keeps its NaNs.
        filled = df.fillna(0)
        query = """
            INSERT INTO source
            (vertex_id, commodity_id, time_id, capacity)
            VALUES (
                (SELECT vertex_id FROM vertex
                 WHERE run_id = %(run_id)s AND
                       vertex_num = %(vertex)s),
                (SELECT commodity_id FROM commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                (SELECT time_id FROM "time"
                 WHERE run_id = %(run_id)s AND
                       time_step = %(time_step)s),
                %(value)s);
            """
        rows = (dict(run_id=run_id, vertex=vertex, commodity=comm,
                     time_step=time_step, value=int(val))
                for (vertex, comm), row in filled.iterrows()
                for time_step, val in row.items())
        _insert_rows(engine, query, rows)
    elif frame in ['flow', 'hub', 'proc_io', 'proc_tau']:
        warnings.warn("<{}> is not implemented yet. "
                      "This frame was not inserted to the database"
                      .format(frame))
    elif frame == 'cost':
        series = df.rename(dict(Inv='investment', Fix='fix', Var='variable'))
        values = {k: int(v) for k, v in series.items()}
        values['run_id'] = run_id
        query = """
            INSERT INTO cost (run_id, variable, investment, fix)
            VALUES (%(run_id)s, %(variable)s, %(investment)s, %(fix)s);
            """
        _insert_rows(engine, query, [values])
    elif frame == 'pmax':
        query = """
            INSERT INTO pmax (edge_id, commodity_id, capacity)
            VALUES (
                (SELECT edge_id FROM edge
                 WHERE run_id = %(run_id)s AND
                       vertex1 = %(va)s AND vertex2 = %(vb)s),
                (SELECT commodity_id from commodity
                 WHERE run_id = %(run_id)s AND
                       commodity LIKE %(commodity)s),
                %(val)s);
            """
        rows = (dict(va=v1, vb=v2, commodity=comm, val=int(val),
                     run_id=run_id)
                for (v1, v2), row in df.iterrows()
                for comm, val in row.items())
        _insert_rows(engine, query, rows)
    elif frame == 'kappa_hub':
        query = """
            INSERT INTO kappa_hub (edge_id, process_id, capacity)
            VALUES (
                (SELECT edge_id FROM edge
                 WHERE run_id = %(run_id)s AND
                       vertex1 = %(va)s AND vertex2 = %(vb)s),
                (SELECT process_id from process
                 WHERE run_id = %(run_id)s AND
                       process LIKE %(hub)s),
                %(val)s);
            """
        rows = (dict(va=v1, vb=v2, hub=hub, val=int(val), run_id=run_id)
                for (v1, v2), row in df.iterrows()
                for hub, val in row.items())
        _insert_rows(engine, query, rows)
    elif frame == 'kappa_process':
        query = """
            INSERT INTO kappa_process (vertex_id, process_id, capacity)
            VALUES (
                (SELECT vertex_id FROM vertex
                 WHERE run_id = %(run_id)s AND
                       vertex_num = %(vertex)s),
                (SELECT process_id from process
                 WHERE run_id = %(run_id)s AND
                       process LIKE %(process)s),
                %(val)s);
            """
        rows = (dict(vertex=int(ver), process=proc, val=int(val),
                     run_id=run_id)
                for ver, row in df.iterrows()
                for proc, val in row.items())
        _insert_rows(engine, query, rows)
    else:
        warnings.warn("<{}> is unknown. "
                      "Frame was not inserted to the database".format(frame))
    return


def store(engine, prob, run_id=None, graph_results=None, run_data=None,
          time_series=None, constants=None):
    """Store I/O plus extras of a rivus model into a postgres DB.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    prob : pyomo ConcreteModel
        Created by rivus.create_model()
    run_id : int, optional
        run_id of an initialized run row in the DB.
        If omitted: init_run() will be called with `run_data`.
    graph_results : iterable, optional
        Results of the graph analysis. Each graph should have its own dict.
        For implemented result keys see `_handle_graph`.
    run_data : dict, optional
        Keyword arguments to be passed to init_run().
        runner, start_ts, status, outcome, comment, plot_dict, profiler
    time_series : sequence, optional
        Already extracted result of ``get_timeseries(prob)``, in the same
        order (source, flow, hub, proc_io, proc_tau).
        If omitted, ``get_timeseries(prob)`` is called.
    constants : sequence, optional
        Already extracted result of ``get_constants(prob)``, in the same
        order (cost, pmax, kappa_hub, kappa_process).
        If omitted, ``get_constants(prob)`` is called.

    Returns
    -------
    None

    Raises
    ------
    Any exception raised during the data export is propagated unchanged.
    Data written before the failure is NOT rolled back.
    """
    if run_id is not None:
        run_id = int(run_id)
    else:
        run_id = init_run(engine, **(run_data or {}))
    print('\tStore params for run <{}>'.format(run_id))

    # Parameter DataFrames
    # --------------------
    # The order of frames -> table does matter.
    # Followings apply to `frames`:
    # `process_commodity` ---> after `process` and `commodity`
    # `vertex`, `area_demand` and `time` ---> after `commodity`
    # `edge` ---> after `area_demand`
    independent = ['commodity', 'process']
    comm_dependent = ['process_commodity', 'area_demand', 'vertex', 'time']
    area_dependent = ['edge']
    for frame in independent + comm_dependent + area_dependent:
        # The frame name is passed explicitly because GeoDataFrames do not
        # carry a name.
        _fill_table(engine, frame, prob.params[frame], run_id)

    # Result DataFrames
    # -----------------
    series_names = ['source', 'flow', 'hub', 'proc_io', 'proc_tau']
    consts_names = ['cost', 'pmax', 'kappa_hub', 'kappa_process']
    # Reuse results handed in by the caller; extract them otherwise.
    series = get_timeseries(prob) if time_series is None else time_series
    consts = get_constants(prob) if constants is None else constants

    results = zip(list(series) + list(consts), series_names + consts_names)
    for df, name in results:
        if not df.empty:
            _fill_table(engine, name, df, run_id)

    if graph_results is not None:
        for g_res in graph_results:
            _handle_graph(engine, g_res, run_id)
    # NOTE: there is no transaction spanning the whole export. Calling
    # purge_run(engine, run_id) after a failure is a quick'n'dirty way for
    # callers to undo a partial export.


def _read_pivoted(engine, sql, run_id, index_col, value_col):
    """Read a long-format query and pivot its last index level to columns.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    sql : str
        Query with a single ``%s`` placeholder for `run_id`.
    run_id : int
        run_id bound to the placeholder in `sql`.
    index_col : list of str
        Result columns forming the index; the last one becomes the columns
        of the returned frame.
    value_col : str
        Result column holding the values.

    Returns
    -------
    DataFrame
        Wide-format frame; combinations without a row are filled with 0.
    """
    long_df = read_sql(sql, engine, params=(run_id,), index_col=index_col)
    return long_df.unstack(level=-1).fillna(0)[value_col]


def df_from_table(engine, fname, run_id):
    """Extract data from the database into a dataframe in a form,
    that is common during the rivus work-flow.

    Implemented DataFrames:

    * rivus_model.params[] dataframes:

        - process
        - commodity
        - process_commodity
        - edge
        - vertex
        - time
        - area_demand

    * get_timeseries dataframes:

        - source

    * get_constants dataframes:

        - cost
        - pmax
        - kappa_hub
        - kappa_process

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    fname : str
        One of the implemented dataframes. (See summary.)
        For 'flow', 'hub', 'proc_io', 'proc_tau' and for unknown names a
        warning is raised and an empty DataFrame is returned.
    run_id : int
        run_id of an initialized run row in the DB.
        You could query the run table for e.g. start date,
        or join it with the vertex table and execute a geographical query
        to get the run_id(s) you want to work with.

    Returns
    -------
    DataFrame or Series
        depending on the data's dimensions.
        Only `cost` returns a Series, to be consistent with get_constants
        (an empty DataFrame if no cost row exists for `run_id`).
    """
    if fname == 'process_commodity':
        sql = """
            SELECT P.process AS "Process",
                   C.commodity AS "Commodity",
                   initcap(PC.direction::text) AS "Direction",
                   PC.ratio AS ratio
            FROM process_commodity AS PC
            INNER JOIN commodity AS C ON PC.commodity_id = C.commodity_id
            INNER JOIN process AS P ON PC.process_id = P.process_id
            WHERE P.run_id = %s;
            """
        df = read_sql(sql, engine, params=(run_id,),
                      index_col=['Process', 'Commodity', 'Direction'])

    elif fname == 'process':
        sql = """
            SELECT process AS "Process",
                   cost_inv_fix AS "cost-inv-fix",
                   cost_inv_var AS "cost-inv-var",
                   cost_fix AS "cost-fix",
                   cost_var AS "cost-var",
                   cap_min AS "cap-min",
                   cap_max AS "cap-max"
            FROM process WHERE run_id = %s;
            """
        df = read_sql(sql, engine, params=(run_id,),
                      index_col='Process')

    elif fname == 'commodity':
        sql = """
            SELECT commodity AS "Commodity", unit,
                   cost_inv_fix AS "cost-inv-fix",
                   cost_inv_var AS "cost-inv-var",
                   cost_fix AS "cost-fix",
                   cost_var AS "cost-var",
                   loss_fix AS "loss-fix",
                   loss_var AS "loss-var",
                   cap_max AS "cap-max",
                   allowed_max AS "allowed-max"
            FROM commodity WHERE run_id = %s;
            """
        df = read_sql(sql, engine, params=(run_id,),
                      index_col='Commodity')

    elif fname == 'edge':
        # Performance Note:
        # A server side solution could be crosstab() from the tablefunc
        # extension.
        # https://www.postgresql.org/docs/9.6/static/tablefunc.html
        # But the SQL queries are kept simple, and data is reshaped in the
        # generally more well-known pandas.DataFrame format.
        sql_demand = """
            SELECT E.vertex1 AS "Vertex1", E.vertex2 AS "Vertex2",
                   A.building_type, ED.value
            FROM edge_demand AS ED
            JOIN edge AS E ON E.edge_id = ED.edge_id
            JOIN area AS A ON A.area_id = ED.area_id
            WHERE E.run_id = %s
            ORDER BY 1,2;
            """
        df_demand = _read_pivoted(engine, sql_demand, run_id,
                                  ['Vertex1', 'Vertex2', 'building_type'],
                                  'value')

        sql_edge = """
            SELECT vertex1 AS "Vertex1", vertex2 AS "Vertex2",
                   ST_AsText(geometry) AS "geometry", edge_num AS "Edge"
            FROM edge
            WHERE run_id = %s
            ORDER BY 1,2;
            """
        df_edge = read_sql(sql_edge, engine, params=(run_id,),
                           index_col=['Vertex1', 'Vertex2'])
        # Geometries arrive as WKT text; turn them back into shapely objects.
        df_edge['geometry'] = df_edge['geometry'].apply(wkt_load)

        df = GeoDataFrame(df_edge.join(df_demand))

    elif fname == 'vertex':
        sql_source = """
            SELECT V.vertex_num AS "Vertex",
                   C.commodity, VS.value
            FROM vertex_source AS VS
            JOIN vertex AS V ON V.vertex_id = VS.vertex_id
            JOIN commodity AS C ON C.commodity_id = VS.commodity_id
            WHERE V.run_id = %s
            ORDER BY 1,2;
            """
        df_source = _read_pivoted(engine, sql_source, run_id,
                                  ['Vertex', 'commodity'], 'value')

        sql_vertex = """
            SELECT vertex_num AS "Vertex", ST_AsText(geometry) AS "geometry"
            FROM vertex
            WHERE run_id = %s
            ORDER BY 1,2;
            """
        df_vertex = read_sql(sql_vertex, engine, params=(run_id,),
                             index_col='Vertex')
        df_vertex['geometry'] = df_vertex['geometry'].apply(wkt_load)

        df = GeoDataFrame(df_vertex.join(df_source))

    elif fname == 'time':
        sql_scale = """
            SELECT T.time_step AS "Time", C.commodity, TD.scale
            FROM time_demand AS TD
            JOIN "time" AS T ON T.time_id = TD.time_id
            JOIN commodity AS C ON C.commodity_id = TD.commodity_id
            WHERE T.run_id = %s
            ORDER BY 1,2;
            """
        df_scale = _read_pivoted(engine, sql_scale, run_id,
                                 ['Time', 'commodity'], 'scale')

        # Ordered by time step so the row order of the result does not
        # depend on the order in which the DB happens to return rows.
        sql_weight = """
            SELECT time_step AS "Time", weight
            FROM "time"
            WHERE run_id = %s
            ORDER BY 1;
            """
        df_weight = read_sql(sql_weight, engine, params=(run_id,),
                             index_col='Time')
        df = df_weight.join(df_scale)

    elif fname == 'area_demand':
        sql = """
            SELECT A.building_type AS "Area", C.commodity as "Commodity",
                   AD.peak
            FROM area_demand AS AD
            JOIN area AS A ON A.area_id = AD.area_id
            JOIN commodity AS C ON C.commodity_id = AD.commodity_id
            WHERE A.run_id = %s
            ORDER BY 1,2;
            """
        df = read_sql(sql, engine, params=(run_id,),
                      index_col=['Area', 'Commodity']).fillna(0)

    elif fname == 'source':
        sql = """
            SELECT V.vertex_num AS "vertex", C.commodity,
                   T.time_step as "time", S.capacity
            FROM source AS S
            JOIN vertex AS V ON V.vertex_id = S.vertex_id
            JOIN commodity AS C ON C.commodity_id = S.commodity_id
            JOIN "time" AS T ON T.time_id = S.time_id
            WHERE V.run_id = %s
            ORDER BY 1,2;
            """
        df = _read_pivoted(engine, sql, run_id,
                           ['vertex', 'commodity', 'time'], 'capacity')

    elif fname == 'cost':
        sql = """
            SELECT variable AS "Var", investment AS "Inv", fix as "Fix"
            FROM cost
            WHERE run_id = %s;
            """
        df = read_sql(sql, engine, params=(run_id,))
        if not df.empty:
            # Only the first row is used, returned as a Series.
            df = Series(df.iloc[0], name='costs')

    elif fname == 'pmax':
        sql = """
            SELECT E.vertex1 AS "Vertex1", E.vertex2 AS "Vertex2", C.commodity,
                   P.capacity
            FROM pmax AS P
            JOIN edge AS E ON E.edge_id = P.edge_id
            JOIN commodity AS C ON C.commodity_id = P.commodity_id
            WHERE E.run_id = %s
            ORDER BY 1,2;
            """
        df = _read_pivoted(engine, sql, run_id,
                           ['Vertex1', 'Vertex2', 'commodity'], 'capacity')

    elif fname == 'kappa_hub':
        sql = """
            SELECT E.vertex1 AS "Vertex1", E.vertex2 AS "Vertex2", P.process,
                   KH.capacity
            FROM kappa_hub AS KH
            JOIN edge AS E ON E.edge_id = KH.edge_id
            JOIN process AS P ON P.process_id = KH.process_id
            WHERE E.run_id = %s
            ORDER BY 1,2;
            """
        df = _read_pivoted(engine, sql, run_id,
                           ['Vertex1', 'Vertex2', 'process'], 'capacity')

    elif fname == 'kappa_process':
        # TODO test
        sql = """
            SELECT V.vertex_num AS "Vertex", P.process, KP.capacity
            FROM kappa_process AS KP
            JOIN vertex AS V ON V.vertex_id = KP.vertex_id
            JOIN process AS P ON P.process_id = KP.process_id
            WHERE V.run_id = %s
            ORDER BY 1,2;
            """
        df = _read_pivoted(engine, sql, run_id,
                           ['Vertex', 'process'], 'capacity')

    elif fname in ['flow', 'hub', 'proc_io', 'proc_tau']:
        warnings.warn("<{}> is not implemented yet. "
                      "Returning an empty DataFrame".format(fname))
        df = DataFrame()
    else:
        warnings.warn("<{}> is unknown. "
                      "Returning an empty DataFrame".format(fname))
        df = DataFrame()
    return df


def get_plot_dict(engine, run_id):
    """Fetch the `plot` value stored for a run in the `run` table.

    Parameters
    ----------
    engine : sqlalchemy engine with psycopg2 driver
        For managing connection to the DB.
    run_id : int
        run_id of an initialized run row in the DB.

    Returns
    -------
    object
        Content of the `plot` column as handed back by the DB driver
        (the value `init_run` stored as JSON text of its `plot_dict`).
        An empty dict if no run with `run_id` exists.

    Raises
    ------
    Any exception raised by the DB driver while querying is propagated.
    """
    string_query = """SELECT plot FROM RUN WHERE run_id = %s;"""

    connection = engine.raw_connection()
    try:
        with connection.cursor() as curs:
            curs.execute(string_query, (run_id, ))
            row = curs.fetchone()
    finally:
        # Only clean up here; returning from `finally` would silently
        # swallow any error raised by the query.
        connection.close()
    # fetchone() yields None when no run matches.
    return {} if row is None else row[0]