import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from scipy import stats as st
from scipy import optimize
import seaborn as sns


def Benefit(q, Health_factor):
    """Return the benefit of consuming quantity ``q`` for a given health factor.

    The benefit is ``Health_factor * ln(q + 1)``: zero at ``q = 0`` and scaled
    linearly by the health factor. The value is NOT negated here; the sign
    flip needed for scipy's minimizers happens in the objective functions.

    ``q`` may be a scalar or a numpy array (evaluated element-wise).
    """
    log_quantity = np.log(q + 1)
    return Health_factor * log_quantity


def Cost(q):
    """Return the cost of providing quantity ``q``: ``exp(q / 40) - 1``.

    The cost is zero at ``q = 0``. ``q`` may be a scalar or a numpy array
    (evaluated element-wise).
    """
    exponential_term = np.exp(q / 40)
    return exponential_term - 1


# Quantity grid used by the plots: 160 evenly spaced points on [0, 160].
q = np.linspace(0, 160, 160)


# Market overview: one benefit curve per integer health factor 1..10,
# together with the single cost curve.
plt.figure(figsize=(16, 8), dpi=80)
for H in range(1, 11):
    plt.plot(q, Benefit(q, H), label=f"Benefit H={H}")

plt.plot(q, Cost(q), color="red", label="Costs")
plt.xlabel("Quantity (q)")
plt.ylabel("Value")
plt.legend()
plt.show()


def objective_function(q, health_factor=None):
    """Return the negated net surplus ``-(Benefit(q, H) - Cost(q))``.

    The sign is flipped because scipy's optimizers search for a minimum;
    minimizing this function therefore maximizes ``Benefit - Cost``.

    Parameters
    ----------
    q : float or array-like
        Quantity at which the surplus is evaluated.
    health_factor : float, optional
        Health factor ``H`` to use. When omitted, the module-level global
        ``Health_factor`` is read at call time, which is how the one-argument
        calls ``minimize_scalar(objective_function)`` work. Passing it
        explicitly, e.g. ``minimize_scalar(objective_function, args=(H,))``,
        avoids depending on whatever value the global currently holds.

    Returns
    -------
    The negative of ``Benefit(q, H) - Cost(q)``.
    """
    if health_factor is None:
        # Fall back to the global so existing one-argument callers keep working.
        health_factor = Health_factor
    return -(Benefit(q, health_factor) - Cost(q))


# Report the surplus-maximizing quantity for every integer health factor 1..10.
# objective_function reads the module-level Health_factor, so the global is
# assigned before each optimizer call.
for i in range(1, 11):
    Health_factor = i
    print(
        "The optimal q with a Health factor of ",
        Health_factor,
        " is: ",
        optimize.minimize_scalar(objective_function).x,
    )

The optimal q with a Health factor of  1  is:  22.04946882287033
The optimal q with a Health factor of  2  is:  33.56611349110644
The optimal q with a Health factor of  3  is:  41.5100503475735
The optimal q with a Health factor of  4  is:  47.6340206478508
The optimal q with a Health factor of  5  is:  52.64051156611696
The optimal q with a Health factor of  6  is:  56.88631665631836
The optimal q with a Health factor of  7  is:  60.57884633148013
The optimal q with a Health factor of  8  is:  63.849852728277206
The optimal q with a Health factor of  9  is:  66.78847404917059
The optimal q with a Health factor of  10  is:  69.4579427894475


# Trace the optimal quantity over a fine grid of health factors:
# 1.00, 1.01, ... up to (but excluding) 11.
List_optimal_q_per_health_factor = []
List_health_factor = []
for i in np.arange(1, 11, 0.01):
    Health_factor = i  # global read by objective_function
    List_health_factor.append(i)
    List_optimal_q_per_health_factor.append(
        optimize.minimize_scalar(objective_function).x
    )

# Optimal quantity as a function of the health factor.
plt.figure(figsize=(8, 6), dpi=80)
plt.plot(List_health_factor, List_optimal_q_per_health_factor)
plt.xlabel("Health factor")
plt.ylabel("optimal q")
plt.show()


# Surplus-maximizing quantities of the two types compared in this figure.
# objective_function reads the global Health_factor, hence the assignments.
Health_factor = 1
Optimal_q_at_H1 = optimize.minimize_scalar(objective_function).x

Health_factor = 3
Optimal_q_at_H3 = optimize.minimize_scalar(objective_function).x

plt.figure(figsize=(10, 6), dpi=80)

plt.plot(q, Benefit(q, 1), label='Health factor = 1')  # benefit curve for health factor 1
plt.plot(q, Benefit(q, 3), label='Health factor = 3')  # benefit curve for health factor 3
plt.plot(q, Cost(q))  # cost curve (drawn without a label)

# Dotted vertical markers at each type's optimal q, running from 0 up to that
# type's own benefit at that quantity.
plt.vlines(
    x=Optimal_q_at_H1, ymin=0, ymax=Benefit(Optimal_q_at_H1, 1),
    label="optimal q at H = 1", linestyle=":", colors='coral',
)
plt.vlines(
    x=Optimal_q_at_H3, ymin=0, ymax=Benefit(Optimal_q_at_H3, 3),
    label="optimal q at H = 3", linestyle=":", colors='brown',
)

# Information rent: at the H = 1 optimal quantity, the gap between the benefit
# of an H = 3 type and the benefit of an H = 1 type.
plt.vlines(
    x=Optimal_q_at_H1,
    ymin=Benefit(Optimal_q_at_H1, 1), ymax=Benefit(Optimal_q_at_H1, 3),
    label="Information Rent", color="purple", linewidth=2,
)

plt.xlim(0, 120)  # show quantities from 0 to 120
plt.ylim(0, 15)  # show values from 0 to 15
plt.legend()
plt.xlabel('Quantity (q)')
plt.ylabel('value')
plt.show()


# Surplus-maximizing quantities of the two types compared in this figure.
# objective_function reads the global Health_factor, hence the assignments.
Health_factor = 1
Optimal_q_at_H1 = optimize.minimize_scalar(objective_function).x

Health_factor = 3
Optimal_q_at_H3 = optimize.minimize_scalar(objective_function).x

# Value of the information rent: benefit gap between an H = 3 and an H = 1 type
# at the H = 1 optimal quantity.
# Stored under its own name so that it does not collide with the
# information_rent() function defined further down in this file.
information_rent_H1_H3 = Benefit(Optimal_q_at_H1, 3) - Benefit(Optimal_q_at_H1, 1)

plt.figure(figsize=(18, 11), dpi=80)

plt.plot(q, Benefit(q, 1), label='Health factor = 1')  # benefit curve for health factor 1
plt.plot(q, Benefit(q, 3), label='Health factor = 3')  # benefit curve for health factor 3
plt.plot(q, Cost(q))  # cost curve (drawn without a label)

# Dotted vertical markers at each type's optimal q, running from 0 up to that
# type's own benefit at that quantity.
plt.vlines(x=Optimal_q_at_H1, ymin=0, ymax=Benefit(Optimal_q_at_H1, 1), label="optimal q at H = 1", linestyle=":", colors='coral')
plt.vlines(x=Optimal_q_at_H3, ymin=0, ymax=Benefit(Optimal_q_at_H3, 3), label="optimal q at H = 3", linestyle=":", colors='brown')

# How the information rent is measured: the benefit gap at the H = 1 optimal q.
plt.vlines(x=Optimal_q_at_H1, ymin=Benefit(Optimal_q_at_H1, 1), ymax=Benefit(Optimal_q_at_H1, 3), label="Information Rent Calculation", color="purple", linewidth=2, linestyle=':')

# The same amount, subtracted from the original price of the unhealthy type's package.
plt.vlines(x=Optimal_q_at_H3, ymin=Benefit(Optimal_q_at_H3, 3) - information_rent_H1_H3, ymax=Benefit(Optimal_q_at_H3, 3), label="Information Rent Substraction", color="purple", linewidth=2)

# Horizontal lines marking the package prices.
plt.hlines(y=Benefit(Optimal_q_at_H1, 1), xmin=0, xmax=Optimal_q_at_H1, label="optimal price at H = 1", linestyle=":", colors='dimgrey')
plt.hlines(y=Benefit(Optimal_q_at_H3, 3), xmin=0, xmax=Optimal_q_at_H3, label="price at H = 3 without information rent", linestyle=":", colors='silver')
plt.hlines(y=Benefit(Optimal_q_at_H3, 3) - information_rent_H1_H3, xmin=0, xmax=Optimal_q_at_H3, label="new price at H = 3 with information rent", linestyle=":", linewidth=2, colors='navy')

plt.xlim(0, 120)  # show quantities from 0 to 120
plt.ylim(0, 15)  # show values from 0 to 15
plt.legend()
plt.xlabel('Quantity (q)')
plt.ylabel('value')
plt.show()


def information_rent(Health_factor_healthy, Health_factor_unhealthy):
    """Return the information rent at the healthy type's optimal quantity.

    The healthy type's quantity ``q_healthy`` is the one that maximizes
    ``Benefit(q, Health_factor_healthy) - Cost(q)``. The information rent is
    the benefit gap between the two types at that quantity:
    ``Benefit(q_healthy, H_unhealthy) - Benefit(q_healthy, H_healthy)``.

    Parameters
    ----------
    Health_factor_healthy : float
        Health factor of the healthy type.
    Health_factor_unhealthy : float
        Health factor of the unhealthy type.
    """
    # The surplus is optimized through a closure over the argument. Assigning
    # to ``Health_factor`` inside this function would only create a local
    # variable, so objective_function would keep reading whatever value the
    # module-level ``Health_factor`` happened to hold and q would be optimized
    # for the wrong type.
    def negative_surplus_healthy(quantity):
        return -(Benefit(quantity, Health_factor_healthy) - Cost(quantity))

    q_healthy = optimize.minimize_scalar(negative_surplus_healthy).x
    return Benefit(q_healthy, Health_factor_unhealthy) - Benefit(q_healthy, Health_factor_healthy)


information_rent(1,6) # example calculation with health factors 1 (healthy) and 6 (unhealthy)

18.748702633700553


def objective_function_insurer(params):
    """Return the negated total profit of the insurer for a pair of packages.

    ``params`` unpacks into ``(q_healthy, q_unhealthy)``, the quantities of the
    two packages being optimized. The health factors are read from the
    module-level globals ``Health_factor_healthy`` and
    ``Health_factor_unhealthy``.

    The result is negated because the scipy optimizer minimizes.
    """
    q_healthy, q_unhealthy = params

    benefit_healthy_type = Benefit(q_healthy, Health_factor_healthy)

    # Information rent: what the unhealthy type would gain over the healthy
    # type by taking the healthy package.
    information_rent_q_healthy = Benefit(q_healthy, Health_factor_unhealthy) - benefit_healthy_type

    # Profit on the healthy type at q_healthy.
    Profit_on_healthy = benefit_healthy_type - Cost(q_healthy)

    # Profit on the unhealthy type at q_unhealthy, reduced by the information rent.
    Profit_on_unhealthy = (
        Benefit(q_unhealthy, Health_factor_unhealthy)
        - information_rent_q_healthy
        - Cost(q_unhealthy)
    )

    total_profit = Profit_on_healthy + Profit_on_unhealthy
    return -total_profit


# Bounds passed to the optimizer: q_healthy and q_unhealthy must each lie in [0, 160].
bnds = ((0, 160), (0, 160))


# Health factors of the two types; objective_function_insurer reads these globals.
Health_factor_healthy = 2
Health_factor_unhealthy = 3

# Maximize the insurer's profit (by minimizing its negative) within the bounds,
# starting from the initial guess (q_healthy, q_unhealthy) = (10, 40).
optimize_with_information_rent = optimize.minimize(
    objective_function_insurer,
    [10, 40],
    method='Nelder-Mead',
    bounds=bnds,
)


# Display the full optimizer result.
optimize_with_information_rent

 final_simplex: (array([[22.04945857, 41.51002997],
       [22.04945898, 41.51010004],
       [22.04940566, 41.51007456]]), array([-11.82860443, -11.82860443, -11.82860443]))
           fun: -11.828604426011676
       message: 'Optimization terminated successfully.'
          nfev: 87
           nit: 45
        status: 0
       success: True
             x: array([22.04945857, 41.51002997])


# Benchmark without information rent: each type's own surplus-maximizing q.
Health_factor = 2
optimal_q_H2 = optimize.minimize_scalar(objective_function).x
print("optimal q without infromation rent in the model at health factor ",Health_factor,": ",optimal_q_H2)

Health_factor = 3
print("optimal q without infromation rent in the model at health factor ",Health_factor,": ",optimize.minimize_scalar(objective_function).x)

# Result of the two-package optimization: x[0] is q_healthy and x[1] is
# q_unhealthy. Each line is labelled with the health factor of the type it
# belongs to; labelling both with ``Health_factor`` would report the healthy
# package under the unhealthy type's health factor.
print("optimal q with information rent in the model at health factor ",Health_factor_healthy,": ",optimize_with_information_rent.x[0])
print("optimal q with information rent in the model at health factor ",Health_factor_unhealthy,": ",optimize_with_information_rent.x[1])

print("This shows that the introduction of information rent in the model results in a decrease in q_healthy of: ",optimal_q_H2-optimize_with_information_rent.x[0])

optimal q without infromation rent in the model at health factor  2 :  33.56611349110644
optimal q without infromation rent in the model at health factor  3 :  41.5100503475735
optimal q with information rent in the model at health factor  3 :  22.049458570686852
optimal q with information rent in the model at health factor  3 :  41.51002996598079
This shows that the introduction of information rent in the model results in a decrease in q_healthy of:  11.51665492041959


# One list per type; together they enumerate every (healthy, unhealthy) pair.
H_healthy_list = []
H_unhealthy_list = []

# All 100 combinations of the health factors 1..10 (step 1): the healthy
# factor varies slowest, the unhealthy factor fastest.
for i in range(1, 11):
    for z in range(1, 11):
        H_healthy_list.append(i)
        H_unhealthy_list.append(z)

# One row per combination.
combinations_df = pd.DataFrame(
    {
        'H_healthy': H_healthy_list,
        'H_unhealthy': H_unhealthy_list,
    }
)


# Result lists, filled row by row and attached to the dataframe as columns afterwards.
Optimal_q_healthy_without_inforent_list = []
Optimal_q_unhealthy_without_inforent_list = []
Optimal_q_healthy_with_inforent_list = []
Optimal_q_unhealthy_with_inforent_list = []
Information_rent_list = []


# Evaluate every health-factor combination.
for index, row in combinations_df.iterrows():
    if row['H_unhealthy'] >= row['H_healthy']:
        # These globals are read by objective_function_insurer.
        Health_factor_healthy = row['H_healthy']
        Health_factor_unhealthy = row['H_unhealthy']

        # Without information rent: each type's own optimum. objective_function
        # reads the global Health_factor, so it is switched between the calls.
        Health_factor = Health_factor_healthy
        Optimal_q_healthy_without_inforent_list.append(
            optimize.minimize_scalar(objective_function).x
        )

        Health_factor = Health_factor_unhealthy
        Optimal_q_unhealthy_without_inforent_list.append(
            optimize.minimize_scalar(objective_function).x
        )

        # With information rent: joint optimization of both package quantities.
        optimize_with_information_rent = optimize.minimize(
            objective_function_insurer,
            [10, 40],
            method='Nelder-Mead',
            bounds=bnds,
        )

        Optimal_q_healthy_with_inforent_list.append(optimize_with_information_rent.x[0])
        Optimal_q_unhealthy_with_inforent_list.append(optimize_with_information_rent.x[1])

        # Information rent at the jointly optimal q_healthy.
        Information_rent_list.append(
            Benefit(optimize_with_information_rent.x[0], Health_factor_unhealthy)
            - Benefit(optimize_with_information_rent.x[0], Health_factor_healthy)
        )

    else:
        # The unhealthy factor is below the healthy one: not a possible
        # combination, so every result is recorded as 0.
        Optimal_q_healthy_without_inforent_list.append(0)
        Optimal_q_unhealthy_without_inforent_list.append(0)
        Optimal_q_healthy_with_inforent_list.append(0)
        Optimal_q_unhealthy_with_inforent_list.append(0)
        Information_rent_list.append(0)

        
# Attach the per-combination results as new columns.
combinations_df['Optimal_q_healthy_without_inforent'] = Optimal_q_healthy_without_inforent_list
combinations_df['Optimal_q_unhealthy_without_inforent'] = Optimal_q_unhealthy_without_inforent_list

combinations_df['Optimal_q_healthy_with_inforent'] = Optimal_q_healthy_with_inforent_list
combinations_df['Optimal_q_unhealthy_with_inforent'] = Optimal_q_unhealthy_with_inforent_list

combinations_df['Information_rent'] = Information_rent_list


# Rationing of the healthy package: how far q_healthy drops once the
# information rent is taken into account, in absolute terms and relative to
# the quantity without information rent.
combinations_df['Q_healthy_rationing'] = combinations_df['Optimal_q_healthy_without_inforent'].sub(
    combinations_df['Optimal_q_healthy_with_inforent']
)
combinations_df['Relative_Q_healthy_rationing'] = combinations_df['Q_healthy_rationing'].div(
    combinations_df['Optimal_q_healthy_without_inforent']
)

# Show the first five rows.
combinations_df.head(5)


# Reshape the column into a 10 x 10 matrix: rows follow the healthy health
# factor, columns the unhealthy health factor.
heatmap_data_informationrent = combinations_df['Information_rent'].to_numpy().reshape(10, 10)
index_Health_factors = range(1, 11)  # health factors 1..10 label both axes

# Labelled matrix, rounded to 2 decimals.
informationrent_matrix = pd.DataFrame(
    heatmap_data_informationrent,
    columns=index_Health_factors,
    index=index_Health_factors,
).round(2)


plt.figure(figsize=(12, 10))
sns.set(font_scale=1)

sns.heatmap(
    informationrent_matrix,
    cmap='coolwarm',
    annot=True,  # print the value in every cell
    fmt='.5g',  # annotation number format
    vmax=15,  # upper end of the colour scale
)

plt.title('Heatmap of information rent per health factor combination', fontsize=17)
plt.xlabel('Health Factor of Unhealthy', fontsize=12)
plt.ylabel('Health Factor of Healthy', fontsize=12)

Text(84.5, 0.5, 'Health Factor of Healthy')


# Absolute rationing of q_healthy as a 10 x 10 matrix: rows follow the healthy
# health factor, columns the unhealthy health factor.
heatmap_data_rationing = combinations_df['Q_healthy_rationing'].to_numpy().reshape(10, 10)
index_Health_factors = range(1, 11)  # health factors 1..10 label both axes

# Labelled matrix, rounded to 1 decimal.
rationing_matrix = pd.DataFrame(
    heatmap_data_rationing,
    columns=index_Health_factors,
    index=index_Health_factors,
).round(1)


plt.figure(figsize=(12, 10))
sns.set(font_scale=1)

sns.heatmap(
    rationing_matrix,
    cmap='coolwarm',
    annot=True,  # print the value in every cell
    fmt='.5g',  # annotation number format
    vmax=60,  # upper end of the colour scale
)

plt.title('Heatmap of rationing of q_healthy per health factor combination', fontsize=17)
plt.xlabel('Health Factor of Unhealthy', fontsize=12)
plt.ylabel('Health Factor of Healthy', fontsize=12)

Text(84.5, 0.5, 'Health Factor of Healthy')


# Relative rationing of q_healthy as a 10 x 10 matrix: rows follow the healthy
# health factor, columns the unhealthy health factor.
heatmap_data_relative_rationing = combinations_df['Relative_Q_healthy_rationing'].to_numpy().reshape(10, 10)
index_Health_factors = range(1, 11)  # health factors 1..10 label both axes

# Labelled matrix, rounded to 1 decimal.
relative_rationing_matrix = pd.DataFrame(
    heatmap_data_relative_rationing,
    columns=index_Health_factors,
    index=index_Health_factors,
).round(1)


plt.figure(figsize=(12, 10))
sns.set(font_scale=1)

sns.heatmap(
    relative_rationing_matrix,
    cmap='coolwarm',
    annot=True,  # print the value in every cell
    fmt='.5g',  # annotation number format
    vmax=1,  # upper end of the colour scale
)

plt.title('Heatmap of relative rationing of q_healthy per health factor combination', fontsize=17)
plt.xlabel('Health Factor of Unhealthy', fontsize=12)
plt.ylabel('Health Factor of Healthy', fontsize=12)

Text(84.5, 0.5, 'Health Factor of Healthy')


# Support of the health-factor distribution: 1000 evenly spaced points on
# [0, 10], i.e. a spacing of 10/999 (roughly 0.01).
x = np.linspace(0, 10, 1000)

# Skew-normal density with shape a = 0, location 0 and scale 2, evaluated on
# the non-negative grid above.
y1 = st.skewnorm.pdf(x, a=0, loc=0, scale=2)

plt.plot(x, y1)  # density curve
plt.xlabel('number')
plt.ylabel('Density')
plt.show()


# Fixed seed so that re-running the analysis draws the same sample.
np.random.seed(10)

# Draw 1000 health factors from the grid x, weighted by the density y1
# (normalized so that the weights sum to 1).
samples_health_factor = np.random.choice(x, size=1000, p=y1 / y1.sum())


# One row per sampled individual.
df_samples = pd.DataFrame({'samples_health_factor': samples_health_factor})


# Individually optimal quantity for every sampled health factor, searched
# within [0, 160] with the bounded scalar minimizer.
optimal_q_list = []
for i in df_samples['samples_health_factor']:
    Health_factor = i  # global read by objective_function
    optimal_q_result = optimize.minimize_scalar(
        objective_function,
        bounds=(0, 160),
        method='bounded',
    )
    optimal_q_list.append(float(optimal_q_result.x))


df_samples['optimal_q'] = optimal_q_list


df_samples.head()  # quick look at the first rows as a sanity check


def objective_function_insurer_population(params):
    """Return the negated total profit over the sampled population.

    ``params`` unpacks into ``(q_healthy, q_unhealthy)``. Every row of the
    module-level ``df_samples`` is assigned a package: rows whose
    ``optimal_q`` is below ``q_unhealthy`` get the healthy package, all other
    rows get the unhealthy package. A row contributes
    ``Benefit(q_package, its health factor) - Cost(q_package)``.

    The sum is negated because the scipy optimizer minimizes.
    """
    q_healthy, q_unhealthy = params

    def profit_of_individual(individual_optimal_q, individual_health_factor):
        # Package choice follows from the individual's own optimal quantity.
        if individual_optimal_q < q_unhealthy:
            package_q = q_healthy
        else:
            package_q = q_unhealthy
        return Benefit(package_q, individual_health_factor) - Cost(package_q)

    # Accumulate in row order, starting from 0.
    profit = sum(
        profit_of_individual(individual_optimal_q, individual_health_factor)
        for individual_optimal_q, individual_health_factor in zip(
            df_samples['optimal_q'], df_samples['samples_health_factor']
        )
    )

    return -(profit)


# Both package quantities are restricted to [0, 160].
bnds = ((0, 160), (0, 160))


# Maximize the population profit (by minimizing its negative) within the
# bounds, using Nelder-Mead from the initial guess
# (q_healthy, q_unhealthy) = (10, 40).
optimize_population = optimize.minimize(
    objective_function_insurer_population,
    [10, 40],
    method='Nelder-Mead',
    bounds=bnds,
)


# Display the full optimizer result.
optimize_population

 final_simplex: (array([[20.32466095, 33.86141037],
       [20.32457644, 33.86141037],
       [20.32469517, 33.86141036]]), array([-4369.47396675, -4369.47396673, -4369.4739667 ]))
           fun: -4369.473966745163
       message: 'Optimization terminated successfully.'
          nfev: 176
           nit: 92
        status: 0
       success: True
             x: array([20.32466095, 33.86141037])


def objective_function_insurer_population_with_information_rent(params):
    """Return the negated population profit, including the information rent.

    ``params`` unpacks into ``(q_healthy, q_unhealthy)``. The rows of the
    module-level ``df_samples`` are split into two groups: rows whose
    ``optimal_q`` is below ``q_unhealthy`` take the healthy package, all other
    rows take the unhealthy package. Each group is represented by the mean
    health factor of its members:

    * every member of the healthy group contributes
      ``Benefit(q_healthy, mean_H_healthy) - Cost(q_healthy)``;
    * every member of the unhealthy group contributes
      ``Benefit(q_unhealthy, mean_H_unhealthy) - Cost(q_unhealthy)`` minus the
      information rent
      ``Benefit(q_healthy, mean_H_unhealthy) - Benefit(q_healthy, mean_H_healthy)``.

    The total is negated because the scipy optimizer minimizes.

    Note: when nobody takes the healthy package while the unhealthy group is
    non-empty, the healthy group's mean health factor is undefined (NaN) and
    the result is NaN.
    """
    q_healthy, q_unhealthy = params

    # Split the population once. The group means do not depend on the
    # individual row, so they are computed a single time instead of once per row.
    takes_healthy_package = df_samples['optimal_q'] < q_unhealthy
    n_healthy = int(takes_healthy_package.sum())
    n_unhealthy = len(df_samples) - n_healthy

    mean_H_healthy = df_samples.loc[takes_healthy_package, 'samples_health_factor'].mean()
    # The complement of the mask is used so that the mean covers exactly the
    # rows that take the unhealthy package, including optimal_q == q_unhealthy.
    mean_H_unhealthy = df_samples.loc[~takes_healthy_package, 'samples_health_factor'].mean()

    profit = 0
    if n_healthy:
        profit_per_healthy = Benefit(q_healthy, mean_H_healthy) - Cost(q_healthy)
        profit += n_healthy * profit_per_healthy

    # Guarded so that an empty unhealthy group (whose mean is NaN) adds
    # nothing instead of turning the whole sum into NaN.
    if n_unhealthy:
        information_rent_per_unhealthy = (
            Benefit(q_healthy, mean_H_unhealthy) - Benefit(q_healthy, mean_H_healthy)
        )
        profit_per_unhealthy = (
            Benefit(q_unhealthy, mean_H_unhealthy)
            - Cost(q_unhealthy)
            - information_rent_per_unhealthy
        )
        profit += n_unhealthy * profit_per_unhealthy

    return -(profit)


# Both package quantities are restricted to [0, 160].
bnds = ((0, 160), (0, 160))


# Maximize the population profit including the information rent (by
# minimizing its negative) within the bounds, using Nelder-Mead from the
# initial guess (q_healthy, q_unhealthy) = (10, 40).
optimize_population_with_information_rent = optimize.minimize(
    objective_function_insurer_population_with_information_rent,
    [10, 40],
    method='Nelder-Mead',
    bounds=bnds,
)


# Display the full optimizer result.
optimize_population_with_information_rent

 final_simplex: (array([[ 29.13075711, 134.81815466],
       [ 29.13075712, 134.81806335],
       [ 29.13075712, 134.81816103]]), array([-4242.49040235, -4242.49040235, -4242.49040235]))
           fun: -4242.490402354217
       message: 'Optimization terminated successfully.'
          nfev: 122
           nit: 55
        status: 0
       success: True
             x: array([ 29.13075711, 134.81815466])


# Largest individually optimal quantity in the sampled population.
# NOTE(review): the q_unhealthy reported by the optimization with information
# rent lies above this maximum; in that case every row satisfies
# optimal_q < q_unhealthy and is treated as taking the healthy package.
df_samples['optimal_q'].max()

58.44503446321638

	H_healthy	H_unhealthy	Optimal_q_healthy_without_inforent	Optimal_q_unhealthy_without_inforent	Optimal_q_healthy_with_inforent	Optimal_q_unhealthy_with_inforent	Q_healthy_rationing	Relative_Q_healthy_rationing
0	1	1	22.049469	22.049469	22.049493	22.049447	-0.000024	-0.000001
1	1	2	22.049469	33.566113	0.000000	33.566148	22.049469	1.000000
2	1	3	22.049469	41.510050	0.000000	41.510018	22.049469	1.000000
3	1	4	22.049469	47.634021	0.000000	47.634043	22.049469	1.000000
4	1	5	22.049469	52.640512	0.000000	52.640540	22.049469	1.000000

	samples_health_factor	optimal_q
0	2.402402	37.053853
1	0.050050	0.954780
2	1.801802	31.660280
3	2.292292	36.144567
4	1.341341	26.595653

Introduction¶

Research question¶

Motivation¶

Preview of the answers¶

Main assumptions¶

Model in the paper¶

My extension to the model¶

Rationing of the healthy quantity¶

Population Healthcare Model¶

Python code¶

Importing libraries¶

Base Model¶

Market visualization graph¶

Objective function optimal quantity¶

Information rent¶

Graphical explanation of information rent¶

Information rent without rationing¶

Quantity rationing for the healthy types¶

Optimal quantity levels for both packages¶

Health Factor Combinations¶

Heatmaps of combinations¶

Information rent heatmap¶

Rationing Heatmap¶

Relative rationing heatmap¶

Representative population¶

Population optimization without information rent¶

Population optimization with information rent - for future research¶

Discussion and conclusion¶

Research question¶

Conclusion¶

Discussion¶