Source code for atra.transport_flow_and_failure_functions

"""Functions used in the provincial and national-scale network failure analysis
"""
import ast
import copy
import csv
import itertools
import json
import math
import operator
import os
import sys
from collections import defaultdict
from itertools import chain

import geopandas as gpd
import igraph as ig
import networkx as nx
import numpy as np
import pandas as pd
from tqdm import tqdm

from atra.utils import *

def spatial_scenario_selection(network_shapefile, polygon_dataframe, hazard_dictionary,
                               data_dictionary, network_id_column, network_type='nodes'):
    """Intersect network edges/nodes and boundary Polygons to collect boundary and hazard attributes

    Parameters
    ---------
    - network_shapefile - Shapefile of edge LineStrings or node Points
    - polygon_dataframe - GeoDataFrame of boundary Polygons
    - hazard_dictionary - Dictionary of hazard attributes
    - data_dictionary - List of network-hazard-boundary intersection attributes
    - network_id_column - String name of the network ID column
    - network_type - String value - 'edges' or 'nodes' - Default = 'nodes'

    Outputs
    -------
    data_dictionary - List of dictionaries of network-hazard-boundary intersection attributes:
        - edge_id/node_id - String name of intersecting edge ID or node ID
        - length - Float length of intersection of edge LineString and hazard Polygon: Only for edges
        - province_id - String/Integer ID of Province
        - province_name - String name of Province in English
        - department_id - String/Integer ID of Department
        - department_name - String name of Department in English
        - hazard_attributes - Dictionary of all attributes from hazard dictionary
    """
    line_gpd = gpd.read_file(network_shapefile)
    poly_gpd = polygon_dataframe

    if len(line_gpd.index) > 0 and len(poly_gpd.index) > 0:
        print(network_shapefile, len(line_gpd.index), len(poly_gpd.index))
        line_gpd.columns = map(str.lower, line_gpd.columns)
        poly_gpd.columns = map(str.lower, poly_gpd.columns)

        # create spatial index
        poly_sindex = poly_gpd.sindex
        for l_index, lines in line_gpd.iterrows():
            intersected_polys = poly_gpd.iloc[list(
                poly_sindex.intersection(lines.geometry.bounds))]
            for p_index, poly in intersected_polys.iterrows():
                if lines['geometry'].intersects(poly['geometry']) and poly.geometry.is_valid and lines.geometry.is_valid:
                    if network_type == 'edges':
                        value_dictionary = {network_id_column: lines[network_id_column],
                                            'length': 1000.0*line_length(lines['geometry'].intersection(poly['geometry'])),
                                            'province_id': poly['province_id'],
                                            'province_name': poly['province_name'],
                                            'department_id': poly['department_id'],
                                            'department_name': poly['department_name']}
                    elif network_type == 'nodes':
                        value_dictionary = {network_id_column: lines[network_id_column],
                                            'province_id': poly['province_id'],
                                            'province_name': poly['province_name'],
                                            'department_id': poly['department_id'],
                                            'department_name': poly['department_name']}

                    data_dictionary.append({**value_dictionary, **hazard_dictionary})

    del line_gpd, poly_gpd
    return data_dictionary
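# A hedged usage sketch ('edges.shp' and 'boundaries.shp' are hypothetical; the boundary
# file must carry province_id/province_name/department_id/department_name columns, and
# the hazard dictionary is copied onto every intersection record):
#
#     >>> boundaries = gpd.read_file('boundaries.shp')
#     >>> records = spatial_scenario_selection(
#     ...     'edges.shp', boundaries,
#     ...     {'hazard_type': 'fluvial flooding', 'probability': 0.1},
#     ...     [], 'edge_id', network_type='edges')
#     >>> pd.DataFrame(records).head()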
def combine_hazards_and_network_attributes_and_impacts(hazard_dataframe, network_dataframe, network_id_column):
    """Merge hazard exposure lengths onto network edges and compute percentage exposures"""
    hazard_dataframe.rename(columns={
        'length': 'exposure_length',
        'min_depth': 'min_flood_depth',
        'max_depth': 'max_flood_depth'
    }, inplace=True)

    network_dataframe.rename(columns={'length': 'edge_length'}, inplace=True)
    # convert edge lengths from kilometres to metres to match exposure lengths
    network_dataframe['edge_length'] = 1000.0*network_dataframe['edge_length']

    all_edge_fail_scenarios = pd.merge(hazard_dataframe, network_dataframe, on=[
        network_id_column], how='left').fillna(0)

    all_edge_fail_scenarios['percent_exposure'] = 100.0 * \
        all_edge_fail_scenarios['exposure_length']/all_edge_fail_scenarios['edge_length']

    del hazard_dataframe, network_dataframe
    return all_edge_fail_scenarios
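# Worked sketch of the exposure arithmetic: an edge of length 2 km (2000 m after the
# unit conversion) with a 500 m hazard intersection gets
# percent_exposure = 100.0*500/2000 = 25.0.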
def correct_exposures(x, length_thr):
    """Cap exposure percentages at 100% and compute a length-based risk weight"""
    el = float(x.exposure_length)
    ep = float(x.percent_exposure)
    if ep > 100:
        # rescale the exposure length so the percentage is at most 100
        el = 100.0*el/ep
        ep = 100.0
    if el < length_thr:
        return el, ep, 1.0*el/length_thr
    else:
        return el, ep, 1.0
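# Illustrative doctest-style sketch of correct_exposures (values are hypothetical):
#
#     >>> row = pd.Series({'exposure_length': 120.0, 'percent_exposure': 150.0})
#     >>> correct_exposures(row, length_thr=500.0)
#     (80.0, 100.0, 0.16)
#
# The 150% exposure is rescaled to 100%, and the risk weight is 80/500 = 0.16.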
def change_depth_string_to_number(x):
    """Convert depth strings like '20cm' or '2m' to depths in metres"""
    # 'cm' must be tested before 'm', since any 'cm' string also contains 'm'
    if 'cm' in x:
        return 0.01*float(x.split('cm')[0])
    elif 'm' in x:
        return 1.0*float(x.split('m')[0])
    else:
        return x
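# Illustrative behaviour (strings without a recognised unit pass through unchanged):
#
#     >>> change_depth_string_to_number('50cm')
#     0.5
#     >>> change_depth_string_to_number('2m')
#     2.0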
def create_hazard_scenarios_for_adaptation(all_edge_fail_scenarios, index_cols, length_thr):
    tqdm.pandas()
    all_edge_fail_scenarios['min_flood_depth'] = all_edge_fail_scenarios.min_flood_depth.progress_apply(
        lambda x: change_depth_string_to_number(x))
    all_edge_fail_scenarios['max_flood_depth'] = all_edge_fail_scenarios.max_flood_depth.progress_apply(
        lambda x: change_depth_string_to_number(x))

    min_height_prob = all_edge_fail_scenarios.groupby(index_cols)[
        ['min_flood_depth', 'probability']].min().reset_index()
    min_height_prob.rename(columns={'probability': 'min_probability'}, inplace=True)
    max_height_prob = all_edge_fail_scenarios.groupby(index_cols)[
        ['max_flood_depth', 'probability']].max().reset_index()
    max_height_prob.rename(columns={'probability': 'max_probability'}, inplace=True)

    min_max_height_prob = pd.merge(min_height_prob, max_height_prob, how='left', on=index_cols)
    del min_height_prob, max_height_prob

    prob_exposures = all_edge_fail_scenarios.groupby(index_cols + ['probability'])[
        ['percent_exposure', 'exposure_length']].sum().reset_index()
    del all_edge_fail_scenarios

    prob_exposures['exposures_risk'] = prob_exposures.progress_apply(
        lambda x: correct_exposures(x, length_thr), axis=1)
    prob_exposures[['exposure_length', 'percent_exposure', 'risk_wt']] = prob_exposures['exposures_risk'].apply(pd.Series)

    min_exposures = prob_exposures[index_cols + ['exposure_length', 'percent_exposure']].groupby(
        index_cols)[['exposure_length', 'percent_exposure']].min().reset_index()
    min_exposures.rename(columns={'exposure_length': 'min_exposure_length',
                                  'percent_exposure': 'min_exposure_percent'}, inplace=True)
    max_exposures = prob_exposures[index_cols + ['exposure_length', 'percent_exposure']].groupby(
        index_cols)[['exposure_length', 'percent_exposure']].max().reset_index()
    max_exposures.rename(columns={'exposure_length': 'max_exposure_length',
                                  'percent_exposure': 'max_exposure_percent'}, inplace=True)

    exposures = pd.merge(min_exposures, max_exposures, how='left', on=index_cols).fillna(0)
    del min_exposures, max_exposures
    height_prob_exposures = pd.merge(min_max_height_prob, exposures, how='left', on=index_cols).fillna(0)
    del min_max_height_prob, exposures

    prob_exposures = prob_exposures.set_index(index_cols)
    scenarios = list(set(prob_exposures.index.values.tolist()))
    t = len(scenarios)
    print('Number of failure scenarios', t)
    scenarios_list = []
    l = 0
    for sc in scenarios:
        l += 1
        prob_tup = [tuple(x) for x in prob_exposures.loc[[sc],
            ['probability', 'exposure_length', 'risk_wt']].values.tolist()]
        if len(prob_tup) > 1:
            # sort by probability and integrate with the trapezoidal rule
            prob_tup = [(w, x, y) for (w, x, y) in sorted(prob_tup, key=lambda pair: pair[0])]
            risk_wt = 0
            dam_wt = 0
            for p in range(len(prob_tup)-1):
                risk_wt += 0.5*(prob_tup[p+1][0]-prob_tup[p][0])*(prob_tup[p+1][-1]+prob_tup[p][-1])
                dam_wt += 0.5*(prob_tup[p+1][0]-prob_tup[p][0])*(prob_tup[p+1][1]+prob_tup[p][1])
        else:
            risk_wt = prob_tup[0][0]*prob_tup[0][-1]
            dam_wt = prob_tup[0][0]*prob_tup[0][1]

        scenarios_list.append(list(sc) + [risk_wt, dam_wt])
        print('Done with scenario {} out of {}'.format(l, t))

    new_cols = ['risk_wt', 'dam_wt']
    scenarios_df = pd.DataFrame(scenarios_list, columns=index_cols + new_cols)
    scenarios_df = pd.merge(scenarios_df, height_prob_exposures, how='left', on=index_cols).fillna(0)
    del scenarios_list, height_prob_exposures

    return scenarios_df
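# The risk weight integrates the exposure risk over exceedance probabilities with the
# trapezoidal rule: for sorted (probability, exposure, risk) tuples,
# risk_wt = sum over consecutive pairs of 0.5*(p2 - p1)*(r2 + r1).
# A worked sketch with hypothetical 1-in-100, 1-in-50 and 1-in-10 year events:
#
#     >>> prob_tup = [(0.01, 200.0, 0.4), (0.02, 300.0, 0.6), (0.1, 500.0, 1.0)]
#     >>> risk_wt = sum(0.5*(p2 - p1)*(r2 + r1)
#     ...               for (p1, _, r1), (p2, _, r2) in zip(prob_tup[:-1], prob_tup[1:]))
#     >>> round(risk_wt, 4)
#     0.069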
def swap_min_max(x, min_col, max_col):
    """Swap the min and max column values of a row if they are out of order"""
    if x[min_col] < 0 and x[max_col] < 0:
        # both values negative: order by absolute magnitude
        if abs(x[min_col]) > abs(x[max_col]):
            return x[max_col], x[min_col]
        else:
            return x[min_col], x[max_col]
    else:
        if x[min_col] > x[max_col]:
            return x[max_col], x[min_col]
        else:
            return x[min_col], x[max_col]
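# Illustrative behaviour on hypothetical rows (when both values are negative, the pair
# is ordered by absolute magnitude, so the larger loss lands in the max column):
#
#     >>> swap_min_max(pd.Series({'min_tons': 10.0, 'max_tons': 5.0}), 'min_tons', 'max_tons')
#     (5.0, 10.0)
#     >>> swap_min_max(pd.Series({'min_tons': -5.0, 'max_tons': -2.0}), 'min_tons', 'max_tons')
#     (-2.0, -5.0)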
def add_igraph_generalised_costs(G, vehicle_numbers, tonnage):
    # G.es['max_cost'] = list(cost_param*(np.array(G.es['length'])/np.array(G.es['max_speed'])))
    # G.es['min_cost'] = list(cost_param*(np.array(G.es['length'])/np.array(G.es['min_speed'])))
    # print (G.es['max_time'])
    G.es['max_gcost'] = list(
        vehicle_numbers * np.array(G.es['max_time_cost'])
        + tonnage * np.array(G.es['max_tariff_cost'])
    )
    G.es['min_gcost'] = list(
        vehicle_numbers * np.array(G.es['min_time_cost'])
        + tonnage * np.array(G.es['min_tariff_cost'])
    )
    return G
def add_dataframe_generalised_costs(G, vehicle_numbers, tonnage):
    # G.es['max_cost'] = list(cost_param*(np.array(G.es['length'])/np.array(G.es['max_speed'])))
    # G.es['min_cost'] = list(cost_param*(np.array(G.es['length'])/np.array(G.es['min_speed'])))
    # print (G.es['max_time'])
    G['max_gcost'] = list(
        vehicle_numbers * np.array(G['max_time_cost'])
        + tonnage * np.array(G['max_tariff_cost'])
    )
    G['min_gcost'] = list(
        vehicle_numbers * np.array(G['min_time_cost'])
        + tonnage * np.array(G['min_tariff_cost'])
    )
    return G
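# Both helpers apply the same generalised cost formula to each edge:
#     gcost = vehicle_numbers * time_cost + tonnage * tariff_cost
# computed separately from the min and max cost attributes. A minimal sketch on a
# hypothetical two-edge DataFrame:
#
#     >>> df = pd.DataFrame({'min_time_cost': [1.0, 2.0], 'max_time_cost': [2.0, 4.0],
#     ...                    'min_tariff_cost': [0.5, 0.5], 'max_tariff_cost': [1.0, 1.0]})
#     >>> add_dataframe_generalised_costs(df, vehicle_numbers=2, tonnage=10.0)[['min_gcost', 'max_gcost']]
#        min_gcost  max_gcost
#     0        7.0       14.0
#     1        9.0       18.0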
def network_od_path_estimations(graph, source, target, cost_criteria, time_criteria):
    """Estimate the paths, distances, times, and costs for given OD pair

    Parameters
    ---------
    graph
        igraph network structure
    source
        String/Float/Integer name of Origin node ID
    target
        String/Float/Integer name of Destination node ID
    cost_criteria : str
        name of generalised cost criteria to be used: min_gcost or max_gcost
    time_criteria : str
        name of time criteria to be used: min_time or max_time

    Returns
    -------
    edge_path_list : list[list]
        nested lists of Strings/Floats/Integers of edge ID's in routes
    path_dist_list : list[float]
        estimated distances of routes
    path_time_list : list[float]
        estimated times of routes
    path_gcost_list : list[float]
        estimated generalised costs of routes
    """
    paths = graph.get_shortest_paths(source, target, weights=cost_criteria, output="epath")

    edge_path_list = []
    path_dist_list = []
    path_time_list = []
    path_gcost_list = []
    for path in paths:
        edge_path = []
        path_dist = 0
        path_time = 0
        path_gcost = 0
        if path:
            for n in path:
                edge_path.append(graph.es[n]['edge_id'])
                path_dist += graph.es[n]['length']
                path_time += graph.es[n][time_criteria]
                path_gcost += graph.es[n][cost_criteria]

        edge_path_list.append(edge_path)
        path_dist_list.append(path_dist)
        path_time_list.append(path_time)
        path_gcost_list.append(path_gcost)

    return edge_path_list, path_dist_list, path_time_list, path_gcost_list
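# A minimal usage sketch on a hypothetical three-node graph (edge attribute names
# mirror those this module expects; the direct a-c edge loses to the cheaper a-b-c route):
#
#     >>> g = ig.Graph.TupleList([('a', 'b'), ('b', 'c'), ('a', 'c')], directed=False)
#     >>> g.es['edge_id'] = ['e1', 'e2', 'e3']
#     >>> g.es['length'] = [1.0, 1.0, 5.0]
#     >>> g.es['min_time'] = [0.1, 0.1, 0.5]
#     >>> g.es['min_gcost'] = [1.0, 1.0, 5.0]
#     >>> network_od_path_estimations(g, 'a', ['c'], 'min_gcost', 'min_time')
#     ([['e1', 'e2']], [2.0], [0.2], [2.0])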
def write_flow_paths_to_network_files(save_paths_df, min_industry_columns, max_industry_columns,
                                      gdf_edges, save_csv=True, save_shapes=True,
                                      shape_output_path='', csv_output_path=''):
    """Write results to Shapefiles

    Outputs ``gdf_edges`` - a shapefile with minimum and maximum tonnage flows of all
    commodities/industries for each edge of network.

    Parameters
    ---------
    save_paths_df
        Pandas DataFrame of OD flow paths and their tonnages
    min_industry_columns
        List of string names of commodity/industry columns for minimum tonnages
    max_industry_columns
        List of string names of commodity/industry columns for maximum tonnages
    gdf_edges
        GeoDataFrame of network edge set
    save_csv
        Boolean condition to tell code to save created edge csv file
    save_shapes
        Boolean condition to tell code to save created edge shapefile
    shape_output_path
        Path where the output shapefile will be stored
    csv_output_path
        Path where the output csv file will be stored
    """
    edge_min_path_index = defaultdict(list)
    edge_max_path_index = defaultdict(list)
    for row in save_paths_df.itertuples():
        for item in row.min_edge_path:
            edge_min_path_index[item].append(row.Index)

        for item in row.max_edge_path:
            edge_max_path_index[item].append(row.Index)

    edge_flows_min = []
    edge_flows_max = []
    for vals in edge_min_path_index.keys():
        edge_flows = pd.DataFrame(
            list(zip([vals]*len(edge_min_path_index[vals]), edge_min_path_index[vals])),
            columns=['edge_id', 'path_index']).set_index('path_index')
        edge_flows = edge_flows.join(save_paths_df, how='left').fillna(0)
        edge_flows_min.append(edge_flows[['edge_id'] + min_industry_columns].groupby(
            'edge_id')[min_industry_columns].sum().reset_index())
        print('Done with edge {} for min'.format(vals))

    for vals in edge_max_path_index.keys():
        edge_flows = pd.DataFrame(
            list(zip([vals]*len(edge_max_path_index[vals]), edge_max_path_index[vals])),
            columns=['edge_id', 'path_index']).set_index('path_index')
        edge_flows = edge_flows.join(save_paths_df, how='left').fillna(0)
        edge_flows_max.append(edge_flows[['edge_id'] + max_industry_columns].groupby(
            'edge_id')[max_industry_columns].sum().reset_index())
        print('Done with edge {} for max'.format(vals))

    if len(edge_flows_min) == 1:
        edge_flows_min = edge_flows_min[0]
    elif len(edge_flows_min) > 1:
        edge_flows_min = pd.concat(edge_flows_min, axis=0, sort=False,
            ignore_index=True).groupby('edge_id')[min_industry_columns].sum().reset_index()

    if len(edge_flows_max) == 1:
        edge_flows_max = edge_flows_max[0]
    elif len(edge_flows_max) > 1:
        edge_flows_max = pd.concat(edge_flows_max, axis=0, sort=False,
            ignore_index=True).groupby('edge_id')[max_industry_columns].sum().reset_index()

    if min_industry_columns == max_industry_columns:
        for ind in min_industry_columns:
            edge_flows_min.rename(columns={ind: 'min_'+ind}, inplace=True)
            edge_flows_max.rename(columns={ind: 'max_'+ind}, inplace=True)

    edge_flows = pd.merge(edge_flows_min, edge_flows_max, how='left', on=['edge_id']).fillna(0)

    tqdm.pandas()
    if min_industry_columns == max_industry_columns:
        industry_columns = min_industry_columns
    else:
        industry_columns = [x[4:] for x in min_industry_columns]

    for ind in industry_columns:
        edge_flows['swap'] = edge_flows.progress_apply(lambda x: swap_min_max(
            x, 'min_{}'.format(ind), 'max_{}'.format(ind)), axis=1)
        edge_flows[['min_{}'.format(ind), 'max_{}'.format(ind)]] = edge_flows['swap'].apply(pd.Series)
        edge_flows.drop('swap', axis=1, inplace=True)

    gdf_edges = pd.merge(gdf_edges, edge_flows, how='left', on=['edge_id']).fillna(0)

    if save_shapes:
        gdf_edges.to_file(shape_output_path, encoding='utf-8')

    if save_csv:
        gdf_edges.drop('geometry', axis=1, inplace=True)
        gdf_edges.to_csv(csv_output_path, index=False, encoding='utf-8-sig')

    del gdf_edges, save_paths_df
def get_flow_paths_indexes_of_edges(flow_dataframe, path_criteria):
    """Build a lookup from each edge ID to the indexes of all flow paths that use it"""
    tqdm.pandas()
    flow_dataframe[path_criteria] = flow_dataframe.progress_apply(
        lambda x: ast.literal_eval(x[path_criteria]), axis=1)
    edge_path_index = defaultdict(list)
    for k, v in zip(chain.from_iterable(flow_dataframe[path_criteria].ravel()),
                    flow_dataframe.index.repeat(flow_dataframe[path_criteria].str.len()).tolist()):
        edge_path_index[k].append(v)

    del flow_dataframe
    return edge_path_index
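# A small sketch of the resulting index (hypothetical paths stored as stringified
# lists, as they would be after reading flow results back from csv):
#
#     >>> flows = pd.DataFrame({'edge_path': ["['e1', 'e2']", "['e2', 'e3']"]})
#     >>> dict(get_flow_paths_indexes_of_edges(flows, 'edge_path'))
#     {'e1': [0], 'e2': [0, 1], 'e3': [1]}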
def igraph_scenario_edge_failures_new(network_df_in, edge_failure_set, flow_dataframe,
                                      edge_flow_path_indexes, path_criteria, tons_criteria,
                                      cost_criteria, time_criteria, transport_mode, new_path=True):
    """Estimate network impacts of each failure

    When the tariff costs of each path are fixed by vehicle weight

    Parameters
    ---------
    network_df_in - Pandas DataFrame of network
    edge_failure_set - List of string edge ID's
    flow_dataframe - Pandas DataFrame of list of edge paths
    edge_flow_path_indexes - Dictionary of edge ID's to lists of flow path indexes
    path_criteria - String name of column of edge paths in flow dataframe
    tons_criteria - String name of column of path tons in flow dataframe
    cost_criteria - String name of column of path costs in flow dataframe
    time_criteria - String name of column of path travel time in flow dataframe
    transport_mode - String name of transport mode
    new_path - Boolean condition to store the rerouted edge paths - Default = True

    Returns
    -------
    edge_failure_dictionary : list[dict]
        With attributes
        edge_id - String name or list of failed edges
        origin - String node ID of Origin of disrupted OD flow
        destination - String node ID of Destination of disrupted OD flow
        no_access - Boolean 1 (no rerouting) or 0 (rerouting)
        new_cost - Float value of estimated cost of OD journey after disruption
        new_distance - Float value of estimated distance of OD journey after disruption
        new_path - List of string edge ID's of estimated new route of OD journey after disruption
        new_time - Float value of estimated time of OD journey after disruption
    """
    edge_fail_dictionary = []
    # network_df,edge_path_index = identify_all_failure_paths(network_df_in,edge_failure_set,flow_dataframe,path_criteria)
    edge_path_index = list(set(list(chain.from_iterable(
        [path_idx for path_key, path_idx in edge_flow_path_indexes.items()
         if path_key in edge_failure_set]))))

    if edge_path_index:
        select_flows = flow_dataframe[flow_dataframe.index.isin(edge_path_index)]
        del edge_path_index

        network_graph = ig.Graph.TupleList(
            network_df_in[~network_df_in['edge_id'].isin(edge_failure_set)].itertuples(
                index=False), edge_attrs=list(network_df_in.columns)[2:])

        first_edge_id = edge_failure_set[0]
        del edge_failure_set

        A = sorted(network_graph.clusters().subgraphs(),
                   key=lambda l: len(l.es['edge_id']), reverse=True)
        access_flows = []
        edge_fail_dictionary = []
        for i in range(len(A)):
            network_graph = A[i]
            nodes_name = np.asarray([x['name'] for x in network_graph.vs])
            po_access = select_flows[(select_flows['origin_id'].isin(nodes_name)) & (
                select_flows['destination_id'].isin(nodes_name))]

            if len(po_access.index) > 0:
                po_access = po_access.set_index('origin_id')
                origins = list(set(po_access.index.values.tolist()))
                for o in range(len(origins)):
                    origin = origins[o]
                    destinations = po_access.loc[[origin], 'destination_id'].values.tolist()
                    tons = po_access.loc[[origin], tons_criteria].values.tolist()
                    paths = network_graph.get_shortest_paths(
                        origin, destinations, weights=cost_criteria, output="epath")
                    if new_path:
                        for p in range(len(paths)):
                            new_dist = 0
                            new_time = 0
                            new_gcost = 0
                            # use a separate name for the rerouted edge list so the
                            # new_path flag is not overwritten inside the loop
                            new_route = []
                            for n in paths[p]:
                                new_dist += network_graph.es[n]['length']
                                new_time += network_graph.es[n][time_criteria]
                                new_gcost += network_graph.es[n][cost_criteria]
                                new_route.append(network_graph.es[n]['edge_id'])
                            edge_fail_dictionary.append(
                                {'edge_id': first_edge_id, 'origin_id': origin,
                                 'destination_id': destinations[p],
                                 'new_path': new_route, 'new_distance': new_dist,
                                 'new_time': new_time, 'new_cost': tons[p]*new_gcost,
                                 'no_access': 0})
                    else:
                        for p in range(len(paths)):
                            new_dist = 0
                            new_time = 0
                            new_gcost = 0
                            for n in paths[p]:
                                new_dist += network_graph.es[n]['length']
                                new_time += network_graph.es[n][time_criteria]
                                new_gcost += network_graph.es[n][cost_criteria]
                            edge_fail_dictionary.append(
                                {'edge_id': first_edge_id, 'origin_id': origin,
                                 'destination_id': destinations[p],
                                 'new_path': [], 'new_distance': new_dist,
                                 'new_time': new_time, 'new_cost': tons[p]*new_gcost,
                                 'no_access': 0})
                    del destinations, tons, paths
                del origins
                po_access = po_access.reset_index()
                po_access['access'] = 1
                access_flows.append(po_access[['origin_id', 'destination_id', 'access']])
            del po_access

        del A

        if len(access_flows):
            access_flows = pd.concat(access_flows, axis=0, sort=False, ignore_index=True)
            select_flows = pd.merge(select_flows, access_flows, how='left',
                                    on=['origin_id', 'destination_id']).fillna(0)
        else:
            select_flows['access'] = 0

        no_access = select_flows[select_flows['access'] == 0]
        if len(no_access.index) > 0:
            for value in no_access.itertuples():
                edge_fail_dictionary.append(
                    {'edge_id': first_edge_id, 'origin_id': getattr(value, 'origin_id'),
                     'destination_id': getattr(value, 'destination_id'),
                     'new_path': [], 'new_distance': 0, 'new_time': 0,
                     'new_cost': 0, 'no_access': 1})

        del no_access, select_flows

    return edge_fail_dictionary
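# A hedged usage sketch (flows and network_df are hypothetical; the network DataFrame
# must have its from/to node IDs as its first two columns, since ig.Graph.TupleList
# treats the remaining columns as edge attributes):
#
#     >>> edge_index = get_flow_paths_indexes_of_edges(flows, 'min_edge_path')
#     >>> failures = igraph_scenario_edge_failures_new(
#     ...     network_df, ['e1'], flows, edge_index, 'min_edge_path',
#     ...     'min_total_tons', 'min_gcost', 'min_time', 'road')
#     >>> pd.DataFrame(failures).head()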
def rearrange_minmax_values(edge_failure_dataframe):
    """Rearrange min-max columns so that min <= max

    Parameters
    ---------
    edge_failure_dataframe : pandas.DataFrame
        with min-max columns

    Returns
    -------
    edge_failure_dataframe : pandas.DataFrame
        With columns where min < max
    """
    failure_columns = edge_failure_dataframe.columns.values.tolist()
    # keep only the min-max value columns
    failure_columns = [f for f in failure_columns if f not in ('edge_id', 'no_access')]

    industry_columns = list(set([f.split('min_')[1] for f in failure_columns if 'min' in f]))

    for ind in industry_columns:
        edge_failure_dataframe['swap'] = edge_failure_dataframe.apply(
            lambda x: swap_min_max(x, 'min_{}'.format(ind), 'max_{}'.format(ind)), axis=1)
        edge_failure_dataframe[['min_{}'.format(ind), 'max_{}'.format(ind)]
                               ] = edge_failure_dataframe['swap'].apply(pd.Series)
        edge_failure_dataframe.drop('swap', axis=1, inplace=True)

    return edge_failure_dataframe
def network_failure_assembly_shapefiles(edge_failure_dataframe, gdf_edges,
                                        save_edges=True, shape_output_path=''):
    """Write results to Shapefiles

    Outputs gdf_edges - a Shapefile with results of edge failure dataframe

    Parameters
    ---------
    edge_failure_dataframe
        Pandas DataFrame of edge failure results
    gdf_edges
        GeoDataFrame of network edge set with edge ID's and geometry
    save_edges : bool
        Boolean condition to tell code to save created edge shapefile
    shape_output_path : str
        Path where the output shapefile will be stored
    """
    failure_columns = edge_failure_dataframe.columns.values.tolist()
    failure_columns = [f for f in failure_columns if f != 'edge_id']

    for fc in failure_columns:
        gdf_edges[fc] = 0

    for iter_, row in edge_failure_dataframe.iterrows():
        # print (row[1:])
        gdf_edges.loc[gdf_edges['edge_id'] == row['edge_id'], failure_columns] = row[failure_columns].values

    industry_columns = list(set([f.split('min_')[1] for f in failure_columns if 'min' in f]))

    for ind in industry_columns:
        gdf_edges['swap'] = gdf_edges.apply(lambda x: swap_min_max(
            x, 'min_{}'.format(ind), 'max_{}'.format(ind)), axis=1)
        gdf_edges[['min_{}'.format(ind), 'max_{}'.format(ind)]] = gdf_edges['swap'].apply(pd.Series)
        gdf_edges.drop('swap', axis=1, inplace=True)

    if save_edges:
        gdf_edges.to_file(shape_output_path)

    del gdf_edges, edge_failure_dataframe
def edge_failure_sampling(failure_scenarios, edge_column):
    """Criteria for selecting failure samples

    Parameters
    ---------
    failure_scenarios - Pandas DataFrame of failure scenarios
    edge_column - String name of column to select failed edge ID's

    Returns
    -------
    edge_failure_samples - List of unique failed edge ID's
    """
    edge_failure_samples = list(set(failure_scenarios[edge_column].values.tolist()))
    return edge_failure_samples
def merge_failure_results(flow_df_select, failure_df, id_col, tons_col, dist_col, time_col, cost_col):
    """Merge failure results with flow results

    Parameters
    ---------
    flow_df_select : pandas.DataFrame
        edge flow values
    failure_df : pandas.DataFrame
        edge failure values
    id_col : str
        name of column of failed edge ID's
    tons_col : str
        name of column of tonnages in flow dataframe
    dist_col : str
        name of column of distance in flow dataframe
    time_col : str
        name of column of time in flow dataframe
    cost_col : str
        name of column of cost in flow dataframe

    Returns
    -------
    flow_df_select : pandas.DataFrame
        Of edge flow and failure values merged
    """
    flow_df_select = pd.merge(flow_df_select, failure_df, on=[
        'origin_id', 'destination_id'], how='left').fillna(0)
    flow_df_select = flow_df_select[(flow_df_select[tons_col] > 0) & (flow_df_select[id_col] != 0)]

    # differences apply only to rerouted flows; no_access == 1 zeroes them out
    flow_df_select['dist_diff'] = (1 - flow_df_select['no_access'])*(
        flow_df_select['new_distance'] - flow_df_select[dist_col])
    flow_df_select['time_diff'] = (1 - flow_df_select['no_access'])*(
        flow_df_select['new_time'] - flow_df_select[time_col])
    flow_df_select['tr_loss'] = (1 - flow_df_select['no_access'])*(
        flow_df_select['new_cost'] - flow_df_select[cost_col])

    return flow_df_select
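# Worked sketch of the merge arithmetic on one hypothetical OD pair: a rerouted flow
# (no_access == 0) with baseline distance 100 and new_distance 130 gets
# dist_diff = (1 - 0)*(130 - 100) = 30, while a cut-off flow (no_access == 1) gets
# dist_diff = time_diff = tr_loss = 0.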