# Import libraries
from matplotlib import pyplot as plt
import matplotlib.ticker as mtick
import numpy as np
%matplotlib inline


# Shape parameter of the Pareto distribution: ln(5) / ln(4).
# This particular value is said to exemplify the 80/20 axiom.
alpha = np.log(5) / np.log(4)
print("alpha=", alpha)

alpha= 1.160964047443681


# Lower and upper bound of the plotted x range.
# x_min is also read as a global by pareto_PDF and pareto_CDF.
x_min, x_max = 1, 21


# Define Probability Density Function
def pareto_PDF(x, alpha, x_m=None):
    """Return the Pareto probability density evaluated at x.

    Computes ``alpha * x_m**alpha / x**(alpha + 1)`` for ``x >= x_m`` and
    0 for ``x < x_m``, where the distribution carries no probability mass.

    Args:
        x: Scalar or array-like of evaluation points.
        alpha: Shape parameter of the distribution.
        x_m: Scale parameter (lower bound of the support). When omitted,
            the module-level ``x_min`` is used, which keeps existing
            two-argument calls working unchanged.

    Returns:
        A NumPy float for scalar input, otherwise an array shaped like x.
    """
    if x_m is None:
        x_m = x_min
    x = np.asarray(x, dtype=float)
    below = x < x_m
    # Substitute x_m for out-of-support points so the power expression never
    # sees zero or negative bases; those entries are zeroed out afterwards.
    safe_x = np.where(below, x_m, x)
    y = (alpha * (x_m ** alpha)) / (safe_x ** (alpha + 1))
    # Indexing with () unwraps a 0-d result to a scalar and leaves arrays as is.
    return np.where(below, 0.0, y)[()]


# Pareto PDF on linear axes, drawn over the first half of the x range
plt.figure(figsize=(8, 6))
ax = plt.subplot(111)
# Set the tick locations BEFORE the x-limits: placing ticks widens the view
# so that every tick (here 0 and 11) is visible, which would otherwise
# silently override the limits requested below.
plt.xticks(np.arange(0, ((x_max/2)+1), step=1), fontsize=10)
ax.set_xlim(left=1, right=(x_max/2))
plt.title("Pareto Distribution: Probability Density", color="b")
# Plot linewise
x = np.linspace(x_min, (x_max/2), num=1000)
y = pareto_PDF(x, alpha)
ax.plot(x, y, color='b', linewidth=2.0)
# Hide the tick labels on both axes; only the curve's shape matters here
ax.set(yticklabels=[])
ax.set(xticklabels=[])
plt.show()


# Source data: income levels and the matching number of citizens
incomes = [150, 200, 300, 400, 500, 600, 700, 800, 900, 1000, 2000, 3000, 4000, 5000, 10000]
citizens = [400648, 234185, 121996, 74041, 54419, 42072, 34269, 29311, 25033, 22896, 9880, 6069, 4161, 3081, 1104]


def _draw_income_panel(panel, title, log_axes):
    """Draw the income data as red markers joined by a green line on one panel."""
    if log_axes:
        panel.set_yscale('log')
        panel.set_xscale('log')
    panel.plot(incomes, citizens, 'o', color='r')
    panel.plot(incomes, citizens, '-', color='g', alpha=0.6, linewidth=3)
    panel.set_title(title, color="b")
    panel.grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
    panel.set_xlabel("income", color='#999999')
    panel.set_ylabel("number of citizens", color='#999999')


# Two panels side by side, each with its own y axis
fig, axs = plt.subplots(1, 2, sharey=False, figsize=(9,4))
fig.suptitle("1893/1894 Income (Great Britain)")
# Left: linear axes
_draw_income_panel(axs[0], "linear scale", log_axes=False)
# Right: logarithmic x and y axes
_draw_income_panel(axs[1], "log-log scale", log_axes=True)
plt.show()


# Pareto PDF over the first half of the x range, on logarithmic x and y axes
ax = plt.figure(figsize=(8, 6)).add_subplot(1, 1, 1)
ax.set_xlim(left=1, right=(x_max / 2))
ax.set_yscale('log')
ax.set_xscale('log')
ax.grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
ax.set_title("Pareto Distribution: Log-Log", color="b")
# Sample the density at 1000 evenly spaced points and draw it as a line
x = np.linspace(x_min, x_max / 2, num=1000)
y = pareto_PDF(x, alpha)
ax.plot(x, y, color='b', linewidth=2.0)
# Hide the tick labels on both axes
ax.set_yticklabels([])
ax.set_xticklabels([])
plt.show()


# Define Cumulative Distribution Function
def pareto_CDF(x, alpha, x_m=None):
    """Return the Pareto cumulative distribution function evaluated at x.

    Computes ``1 - (x_m / x)**alpha`` for ``x >= x_m`` and 0 for ``x < x_m``
    (the unclamped formula would yield negative values there).

    Args:
        x: Scalar or array-like of evaluation points.
        alpha: Shape parameter of the distribution.
        x_m: Scale parameter (lower bound of the support). When omitted,
            the module-level ``x_min`` is used, which keeps existing
            two-argument calls working unchanged.

    Returns:
        A NumPy float for scalar input, otherwise an array shaped like x.
    """
    if x_m is None:
        x_m = x_min
    x = np.asarray(x, dtype=float)
    below = x < x_m
    # Substitute x_m for out-of-support points so the division and power never
    # see zero or negative values; those entries are zeroed out afterwards.
    safe_x = np.where(below, x_m, x)
    y = 1 - ((x_m / safe_x) ** alpha)
    # Indexing with () unwraps a 0-d result to a scalar and leaves arrays as is.
    return np.where(below, 0.0, y)[()]


# Pareto CDF over the full x range, with guide lines at 80 %, x=4 and x=20
plt.figure(figsize=(10, 6))
ax = plt.subplot(111)
plt.grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
# Set the tick locations BEFORE the x-limits: placing ticks widens the view
# so that every tick (here 0) is visible, which would otherwise silently
# override the left limit requested below.
plt.xticks(np.arange(0, (x_max+1), step=1), fontsize=10)
ax.set_xlim(left=1, right=x_max)
plt.title("Pareto Distribution: CDF", color="b")
plt.xlabel("arbitrary units")
plt.axhline(y=0.8, linestyle=":", color='g')
plt.axvline(x=4, linestyle=":", color='r')
plt.axvline(x=20, linestyle=":", color='r')
# CDF values lie in [0, 1]; xmax=1.0 makes 1.0 render as "100%"
ax.yaxis.set_major_formatter(mtick.PercentFormatter(xmax=1.0, decimals=None, symbol='%'))
# Plot
x = np.linspace(x_min, x_max, num=1000)
y = pareto_CDF(x, alpha)
ax.plot(x, y, color='b', linewidth=2.0)
plt.show()


# Evaluate the CDF at the two x positions marked in the CDF figure
print("4:  ", pareto_CDF(x=4, alpha=alpha))
print("20: ", pareto_CDF(x=20, alpha=alpha))

4:   0.8
20:  0.9691289820417199


# Pareto CDF for several shape parameters, with the same guide lines as the
# single-curve CDF figure
plt.figure(figsize=(10, 6))
ax = plt.subplot(111)
plt.grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
# Set the tick locations BEFORE the x-limits: placing ticks widens the view
# so that every tick (here 0) is visible, which would otherwise silently
# override the left limit requested below.
plt.xticks(np.arange(0, (x_max+1), step=1), fontsize=10)
ax.set_xlim(left=1, right=x_max)
plt.title("Pareto Distribution: Shape Parameters", color="b")
plt.xlabel("arbitrary units")
plt.axhline(y=0.8, linestyle=":", color='g')
plt.axvline(x=4, linestyle=":", color='r')
plt.axvline(x=20, linestyle=":", color='r')
# CDF values lie in [0, 1]; xmax=1.0 makes 1.0 render as "100%"
ax.yaxis.set_major_formatter(mtick.PercentFormatter(xmax=1.0, decimals=None, symbol='%'))
alphas_list = np.array([0.5, 0.75, 1.16, 2])
# Plot one labelled curve per shape parameter
x = np.linspace(x_min, x_max, num=1000)
for shape in alphas_list:
    y = pareto_CDF(x, shape)
    ax.plot(x, y, label=('alpha=' + str(shape)))
# Build the legend once, after all curves have been added
plt.legend()
plt.show()


# Import normal distribution method
from scipy.stats import norm
# Moments of the normal distribution with scipy's default parameters
mean, var, skew, kurt = norm.stats(moments='mvsk')
# Ticks on the normal panels are spaced by one standard deviation
sigma = np.sqrt(var)

# Tick locations shared by the two Pareto panels and the two normal panels.
# pyplot.xticks only affects the current Axes, so the ticks are applied to
# each panel explicitly below.
pareto_ticks = np.arange(0, ((x_max/2)+1), step=1)
normal_ticks = np.arange(-3*sigma, 3*sigma, step=sigma)

fig, axs = plt.subplots(2, 2, sharey=True, figsize=(7,6))
fig.suptitle("Pareto Distribution vs. Normal Distribution", color="r")

# Plot upper left: PDF Pareto
# Ticks go first: placing ticks widens the view to include all of them,
# so the limits must be set afterwards to take effect.
axs[0,0].set_xticks(pareto_ticks)
axs[0,0].set_xlim(left=0, right=(x_max/2))
axs[0,0].grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
axs[0,0].set_title("PDF: Pareto", color="b")
# Function
x = np.linspace(x_min, (x_max/2), num=1000)
y = pareto_PDF(x, alpha)
axs[0,0].plot(x, y, 'b-', lw=2, alpha=1, label='pareto pdf')

# Plot upper right: PDF Normal
axs[0,1].set_xticks(normal_ticks)
axs[0,1].set_xlim(left=-3, right=3)
axs[0,1].grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
axs[0,1].set_title("PDF: Normal", color="g")
# Function: sample between the 1 % and 99 % quantiles
x = np.linspace(norm.ppf(0.01), norm.ppf(0.99), 100)
axs[0,1].plot(x, norm.pdf(x), 'g-', lw=2, alpha=1, label='norm pdf')

# Plot lower left: CDF Pareto
axs[1,0].set_xticks(pareto_ticks)
axs[1,0].set_xlim(left=0, right=x_max/2)
axs[1,0].grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
axs[1,0].set_title("CDF: Pareto", color="b")
# Function
x = np.linspace(x_min, (x_max/2), num=1000)
y = pareto_CDF(x, alpha)
axs[1,0].plot(x, y, 'b-', lw=2, alpha=1, label='pareto cdf')

# Plot lower right: CDF Normal
axs[1,1].set_xticks(normal_ticks)
axs[1,1].set_xlim(left=-3, right=3)
# The y axis is shared, so this limit applies to all four panels
axs[1,1].set_ylim(bottom=0, top=1.05)
axs[1,1].grid(visible=True, which='both', axis='both', color='darkgrey', linestyle='-', linewidth=0.25)
axs[1,1].set_title("CDF: Normal", color="g")
# Function: sample between the 1 % and 99 % quantiles
x = np.linspace(norm.ppf(0.01), norm.ppf(0.99), 1000)
axs[1,1].plot(x, norm.cdf(x), 'g-', lw=2, alpha=1, label='norm cdf')

# Strip axis labels and tick labels from every panel; only the curve shapes
# are being compared, so no tick-label font size is configured.
for ax in axs.flat:
    ax.set(xlabel=None, ylabel=None)
    ax.set(yticklabels=[])
    ax.set(xticklabels=[])
plt.show()

Pareto Principle Revisited¶

What is the Pareto principle?¶

Rationale for this article¶

Who was Pareto?¶

Controversies regarding Pareto¶

What has Pareto got to do with 'his' principle?¶

What did Pareto discover?¶

Pareto distribution¶

Visualization¶

Preliminaries¶

Probability density function (PDF)¶

Pareto on inequality¶

Pareto on historical trends¶

Pareto's power distribution¶

Cumulative distribution function (CDF)¶

What numeric values do we get from our exemplary shape parameter?¶

What about different shape parameters?¶

Discussion¶

Appendix: Pareto distribution vs. normal distribution¶