## Importing Libraries
import pandas as pd
import plotly.graph_objects as go
import plotly.express as px
from IPython.display import display
import ipywidgets as widgets
import pandas as pd
import numpy as np
import matplotlib as mpl # optional (here)
import matplotlib.pyplot as plt
import seaborn # Optional, will only affect the color of bars and the grid
from ipywidgets import widgets, interactive
from ipywidgets import interact, Checkbox, FloatRangeSlider, VBox, HBox
import plotly.graph_objs as go
from plotly.offline import iplot
import plotly.io as pio


import plotly.io as pio

# Show every figure in this notebook through the 'notebook_connected' renderer.
pio.renderers.default = 'notebook_connected'

# Make "plotly" the default template, then pin that template's canvas to a
# fixed 1000x550 size so all figures share the same dimensions.
pio.templates.default = "plotly"
pio.templates["plotly"].layout.update(
    {'autosize': True, 'height': 550, 'width': 1000}
)

Layout({
    'annotationdefaults': {'arrowcolor': '#2a3f5f', 'arrowhead': 0, 'arrowwidth': 1},
    'autosize': True,
    'autotypenumbers': 'strict',
    'coloraxis': {'colorbar': {'outlinewidth': 0, 'ticks': ''}},
    'colorscale': {'diverging': [[0, '#8e0152'], [0.1, '#c51b7d'], [0.2,
                                 '#de77ae'], [0.3, '#f1b6da'], [0.4, '#fde0ef'],
                                 [0.5, '#f7f7f7'], [0.6, '#e6f5d0'], [0.7,
                                 '#b8e186'], [0.8, '#7fbc41'], [0.9, '#4d9221'],
                                 [1, '#276419']],
                   'sequential': [[0.0, '#0d0887'], [0.1111111111111111,
                                  '#46039f'], [0.2222222222222222, '#7201a8'],
                                  [0.3333333333333333, '#9c179e'],
                                  [0.4444444444444444, '#bd3786'],
                                  [0.5555555555555556, '#d8576b'],
                                  [0.6666666666666666, '#ed7953'],
                                  [0.7777777777777778, '#fb9f3a'],
                                  [0.8888888888888888, '#fdca26'], [1.0,
                                  '#f0f921']],
                   'sequentialminus': [[0.0, '#0d0887'], [0.1111111111111111,
                                       '#46039f'], [0.2222222222222222, '#7201a8'],
                                       [0.3333333333333333, '#9c179e'],
                                       [0.4444444444444444, '#bd3786'],
                                       [0.5555555555555556, '#d8576b'],
                                       [0.6666666666666666, '#ed7953'],
                                       [0.7777777777777778, '#fb9f3a'],
                                       [0.8888888888888888, '#fdca26'], [1.0,
                                       '#f0f921']]},
    'colorway': [#636efa, #EF553B, #00cc96, #ab63fa, #FFA15A, #19d3f3, #FF6692,
                 #B6E880, #FF97FF, #FECB52],
    'font': {'color': '#2a3f5f'},
    'geo': {'bgcolor': 'white',
            'lakecolor': 'white',
            'landcolor': '#E5ECF6',
            'showlakes': True,
            'showland': True,
            'subunitcolor': 'white'},
    'height': 550,
    'hoverlabel': {'align': 'left'},
    'hovermode': 'closest',
    'mapbox': {'style': 'light'},
    'paper_bgcolor': 'white',
    'plot_bgcolor': '#E5ECF6',
    'polar': {'angularaxis': {'gridcolor': 'white', 'linecolor': 'white', 'ticks': ''},
              'bgcolor': '#E5ECF6',
              'radialaxis': {'gridcolor': 'white', 'linecolor': 'white', 'ticks': ''}},
    'scene': {'xaxis': {'backgroundcolor': '#E5ECF6',
                        'gridcolor': 'white',
                        'gridwidth': 2,
                        'linecolor': 'white',
                        'showbackground': True,
                        'ticks': '',
                        'zerolinecolor': 'white'},
              'yaxis': {'backgroundcolor': '#E5ECF6',
                        'gridcolor': 'white',
                        'gridwidth': 2,
                        'linecolor': 'white',
                        'showbackground': True,
                        'ticks': '',
                        'zerolinecolor': 'white'},
              'zaxis': {'backgroundcolor': '#E5ECF6',
                        'gridcolor': 'white',
                        'gridwidth': 2,
                        'linecolor': 'white',
                        'showbackground': True,
                        'ticks': '',
                        'zerolinecolor': 'white'}},
    'shapedefaults': {'line': {'color': '#2a3f5f'}},
    'ternary': {'aaxis': {'gridcolor': 'white', 'linecolor': 'white', 'ticks': ''},
                'baxis': {'gridcolor': 'white', 'linecolor': 'white', 'ticks': ''},
                'bgcolor': '#E5ECF6',
                'caxis': {'gridcolor': 'white', 'linecolor': 'white', 'ticks': ''}},
    'title': {'x': 0.05},
    'width': 1000,
    'xaxis': {'automargin': True,
              'gridcolor': 'white',
              'linecolor': 'white',
              'ticks': '',
              'title': {'standoff': 15},
              'zerolinecolor': 'white',
              'zerolinewidth': 2},
    'yaxis': {'automargin': True,
              'gridcolor': 'white',
              'linecolor': 'white',
              'ticks': '',
              'title': {'standoff': 15},
              'zerolinecolor': 'white',
              'zerolinewidth': 2}
})


from IPython.display import HTML

# Bootstrap-styled "Toggle Code" button. Its onclick handler calls a JavaScript
# function `codeToggle()` that is not defined anywhere in this file --
# presumably the notebook front end provides it; TODO confirm.
HTML(
    '''<button type="button" class="btn btn-outline-danger"  onclick="codeToggle();">Toggle Code</button>'''
)


import warnings

# Suppress every warning category for the rest of the session.
warnings.filterwarnings(action='ignore')


## Data Preprocessing
# Poverty table: give the raw columns descriptive names ('region' becomes the
# 'country' merge key), then keep only the columns the plots below use.
poverty_data = pd.read_csv('poverty.csv').rename(columns={
    'region': 'country',
    'atk5': 'Atkinson_Coefficient_(epsilon=0.5)',
    'd9010': 'Percentile_Ratio_(90/10)',
    'poorAll6': 'Relative_Poverty_Rates_Total_Population_60%',
    'poortp': 'Children_Poverty_Rates_Two_Parent_Families_50%',
    'poorsm': 'Children_Poverty_Rates_Single_Mother_Families_50%',
    'pkidsm': '%_Children_Living_in_Single_Mother_Families',
    'eymed': 'Median_Equivalized_Income',
    'average': 'Mean_Equivalized_Income',
})
poverty_data = poverty_data.loc[:, [
    'country',
    'year',
    'gini',
    'Atkinson_Coefficient_(epsilon=0.5)',
    'Percentile_Ratio_(90/10)',
    'Relative_Poverty_Rates_Total_Population_60%',
    'Children_Poverty_Rates_Two_Parent_Families_50%',
    'Children_Poverty_Rates_Single_Mother_Families_50%',
    '%_Children_Living_in_Single_Mother_Families',
    'Median_Equivalized_Income',
    'Mean_Equivalized_Income',
]]

# ISO table: drop the code columns that are not needed and expose the country
# name under 'country' so both tables share a merge key.
loc = (
    pd.read_csv('ISO.csv')
    .drop(columns=['Alpha-2 code', 'ISO 3166-2', 'Numeric code'])
    .rename(columns={'English short name lower case': 'country'})
)

# Rewrite country names in the poverty table to the spelling used for the merge
corrections = {
    'Czech Rebuplic': 'Czech Republic',
    'Cote D Ivoire': "Côte d'Ivoire",
    'Palestine': 'Palestinian Territory, Occupied',
    'South Korea': 'Korea, Republic of (South Korea)',
    'United States': 'United States Of America',
}
poverty_data['country'] = poverty_data['country'].replace(corrections)

# Default (inner) merge: only countries present in both tables are kept.
# The result is written to disk for the later cells to re-read.
data = poverty_data.merge(loc, on='country')
data.to_csv('data.csv', index=False)


import plotly.graph_objs as go
import pandas as pd

# Read in the merged table written by the preprocessing step
data = pd.read_csv('data.csv')

# Only consider rows in which every column is populated
f_data = data.dropna()
# Group the data by year
grouped_data = f_data.groupby('year')

# For each year keep the single row with the highest Gini coefficient.
# Selecting rows by the per-group idxmax labels (instead of groupby.apply)
# leaves 'year' as an ordinary column, which the filter below relies on.
highest_gini_by_year = f_data.loc[grouped_data['gini'].idxmax()]

# Keep only the years that are divisible by 4
filtered_data = highest_gini_by_year[highest_gini_by_year['year'] % 4 == 0]

# One marker per remaining year, labelled with the country name
scatter = go.Scatter(x=filtered_data['year'], y=filtered_data['gini'], mode='markers+text',
                     text=filtered_data['country'], textposition='bottom center')

# Set the title and axis labels
layout = go.Layout(title='Highest Gini Coefficients by Year (in gaps of 4 years)',
                   xaxis_title='Year', yaxis_title='Gini Coefficient')

# The trace is handed to the constructor; the figure does not exist before
# this line, so nothing may call fig.add_trace() earlier in the cell.
fig = go.Figure(data=scatter, layout=layout)
iplot(fig)


## Plotting gini index over time
# Indicator columns that are shown in the hover tooltip of the map
indicator_columns = [
    "Atkinson_Coefficient_(epsilon=0.5)",
    "Percentile_Ratio_(90/10)",
    "Relative_Poverty_Rates_Total_Population_60%",
    "Children_Poverty_Rates_Two_Parent_Families_50%",
    "Children_Poverty_Rates_Single_Mother_Families_50%",
    "%_Children_Living_in_Single_Mother_Families",
    "Median_Equivalized_Income",
    "Mean_Equivalized_Income",
]

# Rows after 1970 with every selected column populated
map_data = data[data.year > 1970][["country", "year", "gini", "Alpha-3 code", *indicator_columns]].dropna()

# Minimum and maximum value of year
min_year = map_data.year.min()
max_year = map_data.year.max()

# Fill in missing years for all countries: the Alpha-3 code is copied from the
# country's first row and every numeric value is set to 0. The placeholder
# rows are collected first and attached with a single pd.concat, because
# DataFrame.append no longer exists in pandas 2.x and appending row by row
# re-scans the whole frame for every (year, country) pair.
observed_pairs = set(zip(map_data.country, map_data.year))
alpha3_by_country = map_data.drop_duplicates("country").set_index("country")["Alpha-3 code"]
zero_values = dict.fromkeys(["gini", *indicator_columns], 0)
missing_rows = [
    {"country": country, "year": year, "Alpha-3 code": alpha3, **zero_values}
    for year in range(int(min_year), int(max_year) + 1)
    for country, alpha3 in alpha3_by_country.items()
    if (country, year) not in observed_pairs
]
if missing_rows:  # skip the concat when every country already covers every year
    map_data = pd.concat([map_data, pd.DataFrame(missing_rows)], ignore_index=True)

# Sort the dataframe by country and year
map_data = map_data.sort_values(["country", "year"]).reset_index(drop=True)

# Animated bubble map: one frame per year, bubble size given by the Gini value
fig = px.scatter_geo(map_data, locations='Alpha-3 code', color="country", hover_name="country", size="gini",
                     projection="natural earth", animation_frame="year", template="plotly_dark",
                     title="Gini index of countries over time",
                     hover_data=indicator_columns)
fig.show()


## Timeline of Gini Index of Countries
# List of countries to be plotted. Each name has to equal a value of
# data.country exactly; the preprocessing step renames 'United States' to
# 'United States Of America' (capital "Of"), so that spelling is used here.
# NOTE(review): the other names are assumed to match the merged table as
# well -- an unmatched name silently yields an empty trace.
countries = ['United States Of America', 'United Kingdom', 'Austria', 'Russia', 'China', 'Germany', 'Australia', 'India', 'South Africa']

# Plotting the graph
fig = px.line(title="Gini Index of Countries over time", template="plotly_dark")

# One line per country, restricted to 1990 and later
for country in countries:
    fig_data = data[(data.country == country) & (data.year >= 1990)][['year', 'gini']]
    fig.add_trace(go.Scatter(x=fig_data['year'], y=fig_data['gini'], name=country, mode='lines'))

# The axis titles are the same for every trace, so they are set once
fig.update_layout(xaxis_title="Year", yaxis_title="Gini Index")

fig.show()


## Plots for different poverty rates
countries = ['Japan', 'Russia', 'India']

# Series drawn in every figure; the column name doubles as the legend entry
poverty_rate_columns = [
    'Relative_Poverty_Rates_Total_Population_60%',
    'Children_Poverty_Rates_Two_Parent_Families_50%',
    'Children_Poverty_Rates_Single_Mother_Families_50%',
    '%_Children_Living_in_Single_Mother_Families',
]

# One dark-themed figure per country, using rows from 1990 onwards
for country in countries:
    fig2 = px.line(title=country, template="plotly_dark")
    from_1990 = (data.country == country) & (data.year >= 1990)
    fig2_data = data.loc[from_1990, ['year', *poverty_rate_columns]]
    for rate_column in poverty_rate_columns:
        fig2.add_trace(go.Scatter(x=fig2_data['year'], y=fig2_data[rate_column],
                                  name=rate_column, mode='lines'))
    fig2.update_layout(xaxis_title="Year", yaxis_title="Percentage")

    fig2.show()


## Plots for different income 
countries = ['Japan', 'Russia', 'India']

# Series drawn in every figure; the column name doubles as the legend entry
income_columns = ['Median_Equivalized_Income', 'Mean_Equivalized_Income']

# One dark-themed figure per country, using rows from 1990 onwards
for country in countries:
    fig2 = px.line(title=country, template="plotly_dark")
    from_1990 = (data.country == country) & (data.year >= 1990)
    fig2_data = data.loc[from_1990, ['year', *income_columns]]
    for income_column in income_columns:
        fig2.add_trace(go.Scatter(x=fig2_data['year'], y=fig2_data[income_column],
                                  name=income_column, mode='lines'))
    fig2.update_layout(xaxis_title="Year", yaxis_title="Income in country's currency")

    fig2.show()


import matplotlib.pyplot as plt
import ipywidgets
import pandas as pd
import os

seaborn.set()
# Define the countries and their corresponding data files
countries = ["India", "Korea", "Singapore", "Switzerland"]
# The paths are assembled with os.path.join rather than a literal that embeds
# backslashes: a backslash is a path separator only on Windows, and a
# backslash followed by "c" inside a normal string literal is an invalid
# escape sequence. On Windows the joined result is the same path as before.
file_names = [os.path.join(".", "created_data", f"{c}.csv") for c in countries]

# Load the data for each country into a list of dataframes (same order as `countries`)
list_df = [pd.read_csv(f) for f in file_names]

# Define the plot function for the interactive widget
def plot(value, Var):
    """Plot one line per country for a percentile band and a variable.

    Reads the module-level ``list_df`` and ``countries``; the i-th frame in
    ``list_df`` is labelled with the i-th entry of ``countries``.

    Parameters
    ----------
    value : str
        Value matched against the ``percentile`` column.
    Var : str
        Value matched against the ``variable`` column; also used as the
        y-axis label and the plot title.
    """
    plt.figure(figsize=(10, 6))
    plt.grid()
    drew_line = False
    for country, df in zip(countries, list_df):
        # Select the data for the specified percentile and variable
        selection = df[(df["variable"] == Var) & (df["percentile"] == value)]
        # Narrow to the first 'shorttype' and then the first 'pop' that occur,
        # so that exactly one series per country is drawn. A country with no
        # matching rows (or a NaN key, which matches nothing) is skipped.
        for key in ("shorttype", "pop"):
            if selection.empty:
                break
            selection = selection[selection[key] == selection[key].iloc[0]]
        if selection.empty:
            continue
        plt.plot(selection['year'], selection['value'], label=country)
        drew_line = True

    # Build the legend once, and only when there is something to list
    if drew_line:
        plt.legend()

    # Add axis labels and a title
    plt.xlabel('Year')
    plt.ylabel(Var)
    plt.title(str(Var))

    # Display the plot
    plt.show()


ipywidgets.interact(plot, value=["p0p50", "p50p90", "p90p100", "p99.9p100", "p99.99p100", "p0p100", "p37p38", "p30p31"],Var = ["Net personal wealth", "Fiscal income "])

interactive(children=(Dropdown(description='value', options=('p0p50', 'p50p90', 'p90p100', 'p99.9p100', 'p99.9…

<function __main__.plot(value, Var)>


import geopandas as gpd
import matplotlib.pyplot as plt
import numpy as np
import ipywidgets

# Country polygons from the 'naturalearth_lowres' dataset bundled with geopandas.
# NOTE(review): geopandas.datasets is reportedly no longer shipped with
# geopandas 1.0 and later -- confirm the installed version provides it.
world = gpd.read_file(gpd.datasets.get_path('naturalearth_lowres'))

# MPI table, read through geopandas; its 'ISO' column is renamed to 'iso_a3'
# so that it can be joined with `world` on that column.
data = gpd.read_file('MPI_national.csv').rename(columns={'ISO': 'iso_a3'})

# Join the shapefile and data on a common column


def plot2(value):
    """Draw a world map coloured by one column of the MPI table.

    Uses the module-level ``world`` (country polygons) and ``data`` (MPI
    table), joined on ``iso_a3``.

    Parameters
    ----------
    value : str
        Name of the column in ``data`` that determines the colour.
    """
    # Left join keeps every polygon; countries without a data row get NaN
    merged = world.merge(data, on='iso_a3', how='left')
    # Cells that cannot be parsed as numbers become NaN instead of raising,
    # matching how the parliament-seats map in this file converts its column.
    merged[value] = pd.to_numeric(merged[value], errors='coerce')

    # Plot the map, coloring by the desired column
    fig, ax = plt.subplots(figsize=(12, 6))
    # After the merge the polygons live in 'geometry_x' (this code expects
    # both inputs to contribute a 'geometry' column), so it is made the
    # active geometry before plotting.
    merged = gpd.GeoDataFrame(merged)
    merged = merged.set_geometry('geometry_x')
    # legend=True already draws the colour bar
    merged.plot(column=value, cmap='YlOrRd', legend=True, ax=ax)
    ax.set_title('Map colored by column')

    #Show the plot
    plt.show()
va = ['MPI Urban','Headcount Ratio Urban','Intensity of Deprivation Urban','MPI Rural','Headcount Ratio Rural','Intensity of Deprivation Rural']
ipywidgets.interact(plot2, value=va )

interactive(children=(Dropdown(description='value', options=('MPI Urban', 'Headcount Ratio Urban', 'Intensity …

<function __main__.plot2(value)>


import os

import ipywidgets

# Assembled with os.path.join so the path also works outside Windows and does
# not rely on backslashes inside a normal string literal.
file_name = os.path.join(".", "created_data", "India.csv")
df = pd.read_csv(file_name)


li = list(df["variable"].unique())
def plot(X_values, year):
    """Show a 'shorttype' selector for one variable of the India table.

    Parameters
    ----------
    X_values : str
        Value matched against the ``variable`` column; also the y-axis label.
    year : int
        Year that is highlighted with a marker on every plotted series.
    """
    df2 = df[df['variable'] == X_values]
    li2 = list(df2["shorttype"].unique())

    def plot_y(y):
        """Plot every percentile/age/pop series of shorttype ``y``."""
        df3 = df2[df2['shorttype'] == y]
        # Called once per figure: a bare plt.grid() toggles grid visibility,
        # so calling it inside the loops makes the outcome depend on how many
        # iterations happen to run.
        plt.grid()
        drew_line = False
        for z in df3["percentile"].unique():
            df4 = df3[df3['percentile'] == z]
            for r in df4["age"].unique():
                df5 = df4[df4['age'] == r]
                for u in df5["pop"].unique():
                    # One series per population group; a NaN group matches
                    # nothing and is skipped.
                    df6 = df5[df5['pop'] == u]
                    if df6.empty:
                        continue
                    plt.plot(df6['year'], df6['value'], label=r)
                    drew_line = True
                    # Mark the selected year, if this series has a value for it
                    at_year = df6.loc[df6['year'] == year, 'value']
                    if not at_year.empty:
                        plt.scatter(year, at_year.iloc[0])
        if drew_line:
            plt.legend()

        # Add axis labels and a title
        plt.xlabel('Year')
        plt.ylabel(X_values)
        plt.title('India')

        # Display the plot
        plt.show()

    # Nested widget: choose the shorttype for the selected variable
    ipywidgets.interact(plot_y, y=li2)
ipywidgets.interact(plot, X_values = li, year = (1990,2020,1))

interactive(children=(Dropdown(description='X_values', options=('Personal carbon footprint  (investments only)…

<function __main__.plot(X_values, year)>


import os

import ipywidgets

# Assembled with os.path.join so the path also works outside Windows and does
# not rely on backslashes inside a normal string literal.
file_name = os.path.join(".", "created_data", "Thailand.csv")
df = pd.read_csv(file_name)


li = list(df["variable"].unique())
def plot(X_values, year):
    """Show a 'shorttype' selector for one variable of the Thailand table.

    Parameters
    ----------
    X_values : str
        Value matched against the ``variable`` column; also the y-axis label.
    year : int
        Year that is highlighted with a marker on every plotted series.
    """
    df2 = df[df['variable'] == X_values]
    li2 = list(df2["shorttype"].unique())

    def plot_y(y):
        """Plot every percentile/age/pop series of shorttype ``y``."""
        df3 = df2[df2['shorttype'] == y]
        # Called once per figure: a bare plt.grid() toggles grid visibility,
        # so calling it inside the loops makes the outcome depend on how many
        # iterations happen to run.
        plt.grid()
        drew_line = False
        for z in df3["percentile"].unique():
            df4 = df3[df3['percentile'] == z]
            for r in df4["age"].unique():
                df5 = df4[df4['age'] == r]
                for u in df5["pop"].unique():
                    # One series per population group; a NaN group matches
                    # nothing and is skipped.
                    df6 = df5[df5['pop'] == u]
                    if df6.empty:
                        continue
                    plt.plot(df6['year'], df6['value'], label=r)
                    drew_line = True
                    # Mark the selected year, if this series has a value for it
                    at_year = df6.loc[df6['year'] == year, 'value']
                    if not at_year.empty:
                        plt.scatter(year, at_year.iloc[0])
        if drew_line:
            plt.legend()

        # Add axis labels and a title
        plt.xlabel('Year')
        plt.ylabel(X_values)
        plt.title('Thailand')

        # Display the plot
        plt.show()

    # Nested widget: choose the shorttype for the selected variable
    ipywidgets.interact(plot_y, y=li2)
ipywidgets.interact(plot, X_values = li, year = (1990,2020,1))

interactive(children=(Dropdown(description='X_values', options=('Personal carbon footprint  (investments only)…

<function __main__.plot(X_values, year)>


import os

import ipywidgets

# Assembled with os.path.join so the path also works outside Windows and does
# not rely on backslashes inside a normal string literal.
file_name = os.path.join(".", "created_data", "Singapore.csv")
df = pd.read_csv(file_name)


li = list(df["variable"].unique())
def plot(X_values, year):
    """Show a 'shorttype' selector for one variable of the Singapore table.

    Parameters
    ----------
    X_values : str
        Value matched against the ``variable`` column; also the y-axis label.
    year : int
        Year that is highlighted with a marker on every plotted series.
    """
    df2 = df[df['variable'] == X_values]
    li2 = list(df2["shorttype"].unique())

    def plot_y(y):
        """Plot every percentile/age/pop series of shorttype ``y``."""
        df3 = df2[df2['shorttype'] == y]
        # Called once per figure: a bare plt.grid() toggles grid visibility,
        # so calling it inside the loops makes the outcome depend on how many
        # iterations happen to run.
        plt.grid()
        drew_line = False
        for z in df3["percentile"].unique():
            df4 = df3[df3['percentile'] == z]
            for r in df4["age"].unique():
                df5 = df4[df4['age'] == r]
                for u in df5["pop"].unique():
                    # One series per population group; a NaN group matches
                    # nothing and is skipped.
                    df6 = df5[df5['pop'] == u]
                    if df6.empty:
                        continue
                    plt.plot(df6['year'], df6['value'], label=r)
                    drew_line = True
                    # Mark the selected year, if this series has a value for it
                    at_year = df6.loc[df6['year'] == year, 'value']
                    if not at_year.empty:
                        plt.scatter(year, at_year.iloc[0])
        if drew_line:
            plt.legend()

        # Add axis labels and a title
        plt.xlabel('Year')
        plt.ylabel(X_values)
        plt.title('Singapore')

        # Display the plot
        plt.show()

    # Nested widget: choose the shorttype for the selected variable
    ipywidgets.interact(plot_y, y=li2)
ipywidgets.interact(plot, X_values = li, year = (1990,2020,1))

interactive(children=(Dropdown(description='X_values', options=('Household direct emissions  ', 'Personal carb…

<function __main__.plot(X_values, year)>


import matplotlib.pyplot as plt
import ipywidgets
import pandas as pd

# Country labels exactly as they are compared against the 'Country' column
# (note the leading space in every entry).
countries = [" India", " Japan", " korea", " United Kingdom", " United states", " Canada", " Iraq"]

def plot(value, year):
    """Bar chart of one index for the countries in ``countries``.

    Parameters
    ----------
    value : str
        Base name of the CSV file to read (``value + ".csv"``); also used in
        the plot title.
    year : int
        Selected year. The column at position ``year - 1993`` is read --
        presumably the file has one column per year; TODO confirm the offset
        against the CSV header.
    """
    df = pd.read_csv(value + ".csv")
    column_position = year - 1993

    year_vals = []
    for c in countries:
        rows = df[df["Country"] == c]
        val = 0  # used when the column or the country is missing
        if column_position < len(rows.columns):
            column = rows.iloc[:, column_position]
            if len(column) != 0:
                val = column.iloc[0]
        year_vals.append(val)

    plt.figure(figsize=(10, 6))
    plt.bar(countries, year_vals, color='skyblue')
    plt.title(value + " in " + str(year))
    plt.xlabel("Countries")
    plt.ylabel("Values")
    plt.xticks(rotation=45)  # rotated so the country names do not overlap
    plt.show()

ipywidgets.interact(plot, value=["gender_inequality_index", "gender_development_index"],year = (1998,2011,1))

interactive(children=(Dropdown(description='value', options=('gender_inequality_index', 'gender_development_in…

<function __main__.plot(value, year)>


import functools

import geopandas as gpd
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import ipywidgets

seaborn.set() 

# Column of the CSV that determines the map colour
_SEATS_COLUMN = 'Proportion of seats held by women in national parliaments (%)'


@functools.lru_cache(maxsize=None)
def _load_world_and_seats():
    """Read the world polygons and the parliament-seats table once.

    The result is cached so that moving the year slider does not re-read
    both files on every tick. Returns ``(world, data)``; neither frame is
    modified by the caller.
    """
    # Read in the shapefile of the world map
    world = gpd.read_file(gpd.datasets.get_path('naturalearth_lowres'))
    # Read in the CSV file with data to plot
    data = gpd.read_file('Viz5_August_Female_Political_Representation.csv')
    data = data.rename(columns={'Country Code': 'iso_a3'})
    # Values that cannot be parsed as numbers become NaN
    data['Year'] = pd.to_numeric(data['Year'], errors='coerce')
    data[_SEATS_COLUMN] = pd.to_numeric(data[_SEATS_COLUMN], errors='coerce')
    return world, data


def plot2(year):
    """Draw a world map of the share of parliament seats held by women.

    Parameters
    ----------
    year : int
        Only rows whose ``Year`` equals this value are plotted.
    """
    value = _SEATS_COLUMN
    world, data = _load_world_and_seats()
    data2 = data[data['Year'] == year]
    # Left join keeps every polygon; countries without a row for `year` get NaN
    merged = world.merge(data2, on='iso_a3', how='left')
    # Plot the map, coloring by the desired column
    fig, ax = plt.subplots(figsize=(12, 6))
    # After the merge the polygons live in 'geometry_x' (this code expects
    # both inputs to contribute a 'geometry' column), so it is made the
    # active geometry before plotting.
    merged = gpd.GeoDataFrame(merged)
    merged = merged.set_geometry('geometry_x')
    # legend=True already draws the colour bar
    merged.plot(column=value, cmap='YlOrRd', legend=True, ax=ax)
    ax.set_title('Map colored by column')

    #Show the plot
    plt.show()
    
ipywidgets.interact(plot2, year= (1997, 2019, 1))

interactive(children=(IntSlider(value=2008, description='year', max=2019, min=1997), Output()), _dom_classes=(…

<function __main__.plot2(year)>


import ipywidgets
file_name = "gender-wage-gap-oecd.csv"
df = pd.read_csv(file_name)
countries = ["Australia", "Japan", "United Kingdom", "Canada"]


def plot(co):
    """Plot the gender wage gap over time for one country.

    Parameters
    ----------
    co : str
        Value matched against the ``Entity`` column of the module-level
        ``df``; also used as the legend label and the title.
    """
    df2 = df[df['Entity'] == co]
    plt.figure(figsize=(20, 10))
    plt.plot(df2['Year'], df2['Gender wage gap (OECD 2017)'], label=co)
    # Must be called: a bare `plt.legend` only references the function and
    # never draws the legend.
    plt.legend()

    # Add axis labels and a title
    plt.xlabel('Year')
    plt.ylabel('Gender wage gap')
    plt.title(co)

    # Display the plot
    plt.show()

ipywidgets.interact(plot, co = countries)

interactive(children=(Dropdown(description='co', options=('Australia', 'Japan', 'United Kingdom', 'Canada'), v…

<function __main__.plot(co)>


import pandas as pd
import matplotlib.pyplot as plt
import seaborn 
seaborn.set()

# Load the table without its last two rows, rank the remaining rows from the
# highest to the lowest share, then drop the two lowest-ranked rows as well.
path = 'top_female.csv'
df = pd.read_csv(path).iloc[:-2]
sorted_df = df.sort_values(by='Firms with female top manager (% of firms)', ascending=False)
df = sorted_df[:-2]

# x labels, bar heights, and a constant reference level of 17.68
li = list(df['Entity'])
li2 = list(df['Firms with female top manager (% of firms)'])
li3 = [17.68 for _ in li2]

# Bars per country with the reference level drawn as a blue line on top
plt.figure(figsize=(20, 10))
plt.bar(li, li2, width=0.8, color='skyblue')
plt.title('Firms with female top manager (% of firms)')
plt.plot(li, li3, color='blue')
plt.xlabel('Countries')
plt.ylabel('Firms with female top manager (% of firms)')
plt.xticks(fontsize='6', rotation=45)  # small rotated labels for the many bars
plt.show()


import pandas as pd
import matplotlib.pyplot as plt
import seaborn 
seaborn.set() 

# Read the CSV file into a pandas dataframe, without its last two rows
path = 'top_female.csv'
df = pd.read_csv(path)
df = df.iloc[:-2]
li = list(df['Entity'])
li2 = list(df['Firms with female top manager (% of firms)'])
# Constant reference level at 50 (% of firms)
li3 = [50]*len(li2)
# Scatter plot: one point per country, with the reference level as a blue line.
# No `cmap` is passed: without per-point colour data (`c=`) matplotlib ignores
# a colormap, so the points keep the default colour.
plt.figure(figsize=(20, 10))
plt.scatter(li, li2)
plt.title('Firms with female top manager (% of firms)')
plt.plot(li,li3,color='blue')
plt.xlabel('Countries')
plt.ylabel('Firms with female top manager (% of firms)')
# Hide the country names on the x axis
plt.gca().set_xticklabels([])
plt.show()


import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

sns.set() 

# Countries offered in the dropdown
lir = ["United Kingdom", "Canada", "Argentina"]

def plot(con):
    """Plot the top-20 % / bottom-20 % ratio over time for one country.

    Parameters
    ----------
    con : str
        Value matched against the ``country`` column of the CSV file.
    """
    # Read the CSV file into a pandas dataframe
    path = 'WIID_06MAY2020.csv'
    df = pd.read_csv(path)
    df = df[df['country']==con]
    # Keep the first row of every year
    df = df.drop_duplicates(subset=['year'], keep='first')
    
    # Interpolate missing values of the plotted column only. The default
    # linear method works on row position, so the result for this column is
    # the same as interpolating the whole frame, without touching the
    # columns that are not plotted.
    ratio = df['ratio_top20bottom20'].interpolate()
    
    plt.figure(figsize=(20, 10))
    plt.plot(df['year'], ratio)
    plt.title('ratio_top20bottom20')
    plt.xlabel('Years')
    plt.ylabel('Ratio')
    plt.show()

ipywidgets.interact(plot, con = lir)

interactive(children=(Dropdown(description='con', options=('United Kingdom', 'Canada', 'Argentina'), value='Un…

<function __main__.plot(con)>

# World Income Inequality and Poverty Analysis

# Hypothesis

# If the interactive plots are not visible:

# Conclusion