# necessary imports
from scipy import optimize
from numpy import array,arange
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
import pandas as pd 
import statsmodels.formula.api as sm
from math import log
from statsmodels.iolib.summary2 import summary_col #To include three regression models in one table.


# defining the production function for simulation
def production_function(K, L, alpha):
    """Return Cobb-Douglas output ``K**alpha * (A*L)**(1-alpha)``.

    K is capital, L is labour and alpha is the exponent on capital.  The
    technology level ``A`` is not an argument: it is read from the
    module-level variable ``A`` at the time of the call.
    """
    effective_labour = A * L
    capital_term = K ** alpha
    return capital_term * (effective_labour ** (1 - alpha))


# Grid of capital (K) values for the x-axis of the graphs: starts at 0 and
# advances in steps of 0.01 towards 1300.
range_K = np.arange(0.0, 1300.0, 0.01)


type(range_K)

numpy.ndarray


# Exogenous parameters of the model
alpha = 1 / 3            # share of capital
A, L = 1.5, 1            # technology level, labour
s = 0.3                  # savings rate
n, d, g = 0.02, 0.1, 0.1  # population growth, depreciation, technological growth


# Figure: output Y as a function of capital K, with labour held at L.
plt.title("Production function",fontsize=15)
plt.xlabel("Capital(K)", fontsize=15)
plt.ylabel("Output (Y)",fontsize=15)
# production_function is built from plain arithmetic, so passing the whole
# range_K array evaluates every grid point in one vectorised call instead of
# looping over the array element by element in Python.
plt.plot(range_K, production_function(range_K, L, alpha), label="Y")

plt.legend()  # legend box
plt.grid()  # grid lines
plt.axis([-5, 50, -1, 6])  # zoom in: x from -5 to 50, y from -1 to 6
plt.show()


# defining the production per effective worker function for simulation
def production_function_per_eff_w(K, alpha):
    """Return output per effective worker, ``(K / (A*L))**alpha``.

    K is the *level* of capital; it is divided by ``A*L`` inside the function.
    ``A`` and ``L`` are read from the module-level variables of those names
    at the time of the call.
    """
    capital_per_eff_worker = K / (A * L)
    return capital_per_eff_worker ** alpha


# Figure: output per effective worker y against capital per effective worker k.
plt.title("Production per effective worker function",fontsize=15)
plt.xlabel("Capital per effective worker (k)", fontsize=15)
plt.ylabel("Output per effective worker (y)",fontsize=15)
# range_K holds capital *levels*, so the x-axis is range_K/(A*L) to express it
# per effective worker.  production_function_per_eff_w performs the same
# division internally and is plain arithmetic, so it is applied to the whole
# array in one vectorised call rather than once per grid point.
plt.plot(range_K/(A*L), production_function_per_eff_w(range_K, alpha), label="y")

plt.legend()
plt.grid()
plt.axis([-5, 50, -1, 6])  # zoom in: x from -5 to 50, y from -1 to 6
plt.show()


# defining the effective depreciation
def effective_depreciation(n, d, g, K):
    """Return ``(n + d + g) * K / (A*L)``.

    n, d and g are added together and multiplied by capital per effective
    worker.  K is the *level* of capital; ``A`` and ``L`` are read from the
    module-level variables of those names at the time of the call.
    """
    combined_rate = n + d + g
    capital_per_eff_worker = K / (A * L)
    return combined_rate * capital_per_eff_worker


# Figure: saving per effective worker (s*y) against the (n+d+g)*k line.
plt.title("Production per effective worker function",fontsize=15)
plt.xlabel("Capital per effective worker (k)", fontsize=15)
plt.ylabel("Output per effective worker (y)",fontsize=15)
# range_K holds capital *levels*, so the x-axis is range_K/(A*L); both helper
# functions take the level of capital and divide by A*L themselves.  They are
# plain arithmetic, so each curve is computed with one vectorised call on the
# whole array instead of a Python-level loop over every grid point.
plt.plot(range_K/(A*L), production_function_per_eff_w(range_K, alpha)*s, label="s.y")
plt.plot(range_K/(A*L), effective_depreciation(n, d, g, range_K), label="(n+d+g).k")

plt.legend()
plt.grid()
plt.axis([-0.2, 4, -0.2, 1])  # zoom in: x from -0.2 to 4, y from -0.2 to 1
plt.show()


# Closed-form steady state: setting s*k**alpha equal to (n+d+g)*k and solving
# for k gives kstar = (s/(n+d+g))**(1/(1-alpha)).
pow(s / (n + d + g), 1 / (1 - alpha))

1.5923842039667508


# Numerical steady state: the k at which saving per effective worker, s*y,
# equals (n+d+g)*k.
initial_guess = 1  # fsolve needs a starting estimate for the root


def _saving_minus_break_even(k):
    """Return s*y - (n+d+g)*k at capital per effective worker ``k``."""
    # Both helper functions expect the *level* of capital, so convert k back
    # to a level by multiplying with A*L before calling them.
    capital_level = k * A * L
    saving = production_function_per_eff_w(capital_level, alpha) * s
    return saving - effective_depreciation(n, d, g, capital_level)


# optimize.fsolve returns the value(s) of k for which the function above is
# zero.  According to the SciPy documentation it wraps MINPACK's hybrd/hybrj
# root finders (a modified Powell hybrid method).
kstar = optimize.fsolve(_saving_minus_break_even, initial_guess)


kstar

array([1.5923842])


# Figure: y, s*y and (n+d+g)*k with the steady state kstar marked.
plt.title("Production per effective worker function",fontsize=15)
plt.xlabel("Capital per effective worker (k)", fontsize=15)
plt.ylabel("Output per effective worker (y)",fontsize=15)

# range_K holds capital *levels*; dividing by A*L gives capital per effective
# worker for the x-axis.  The helper functions are plain arithmetic, so each
# curve is evaluated on the whole array at once instead of point by point.
k_grid = range_K / (A * L)
y_grid = production_function_per_eff_w(range_K, alpha)
plt.plot(k_grid, y_grid, label="y")
plt.plot(k_grid, y_grid * s, label="s.y")
plt.plot(k_grid, effective_depreciation(n, d, g, range_K), label="(n+d+g).k")

# Vertical dashed line at kstar.  Two end points are enough for a straight
# line; there is no need to build one (x, y) pair per element of range_K.
# kstar comes from fsolve as a one-element array, hence the [0].
kstar_value = float(kstar[0])
plt.plot([kstar_value, kstar_value], [range_K[0], range_K[-1]], '--', label="kstar")

plt.legend()
plt.grid()
plt.axis([-0.5, 10, -0.5, 2.5])
plt.show()


# GDP growth rate in percent, computed as the sum g + n.  (With the
# year-by-year compounding used in the simulation the exact rate would be
# (1+g)*(1+n) - 1; g + n is the first-order approximation.)
print(f"{round((g + n) * 100, 2)} percent")

12.0 percent


# Savings rate for the baseline simulation: 30%
s = 0.3


# Initial values: capital, labour and technology level all start at 1
K0, L0, A0 = 1, 1, 1
Y0 = (A0 * L0) ** (1 - alpha) * K0 ** alpha  # from the production function
Y_AL0 = Y0 / (A0 * L0)  # output per effective worker
T = 100  # number of years to simulate


# Paths of the main variables, each seeded with its initial value.
# NOTE: from here on the names L and A refer to lists, not to the scalar
# parameters defined earlier; the helper functions that read A and L as
# globals will no longer work on them if they are re-run after this point.
Time = [1901]   # year
L = [L0]        # labour
K = [K0]        # capital
A = [A0]        # technology level
Y = [Y0]        # output
Y_AL = [Y_AL0]  # output per effective worker
for _ in range(T):
    # [-1] is always the most recent entry: last year's value before the
    # append, this year's value after it.
    L.append((1 + n) * L[-1])  # labour grows at rate n
    A.append((1 + g) * A[-1])  # technology grows at rate g
    # next year's capital = saving out of last year's output
    #                       - depreciation + last year's capital
    K.append(s * Y[-1] - d * K[-1] + K[-1])
    # this year's output uses this year's A, L and K (appended just above)
    Y.append((A[-1] * L[-1]) ** (1 - alpha) * K[-1] ** alpha)
    Y_AL.append(Y[-1] / (A[-1] * L[-1]))
    Time.append(Time[-1] + 1)


# Gather the simulated paths into one DataFrame (one row per year)
column_names = ['Time', 'Y', 'K', 'L', 'A', 'Y/AL']
data = pd.DataFrame(dict(zip(column_names, [Time, Y, K, L, A, Y_AL])))
data


# Y becomes very large over 100 years, so its natural log is plotted as well.
log_Y = list(map(log, Y))


fig, ax = plt.subplots(3, 1, figsize=(14, 16))  # three panels stacked in one column

# One entry per panel: (series, line colour, legend label, panel title)
panels = [
    (Y_AL, 'r', 'Y/AL', 'Production per effective worker function'),
    (Y, 'b', 'Y', 'Production'),
    (log_Y, 'g', 'log_Y', 'log Production'),
]
for panel, (series, colour, name, heading) in zip(ax, panels):
    panel.plot(Time, series, colour, label=name)
    if name == 'Y':
        # only the level of output gets plain (non-scientific) tick labels
        panel.ticklabel_format(style='plain')
    panel.set_title(heading, fontweight="bold")
    panel.grid()
    panel.legend()

# Axis labels shared by all three panels
fig.supxlabel('Time')
fig.supylabel('Values')

plt.show()


# Savings rates to compare.  The list has its own name so that the loop
# variable `s` below does not overwrite the list it is iterating over.
savings_rates = [0.20, 0.30, 0.35, 0.40, 0.45]
data_list = []  # one DataFrame of simulated paths per savings rate, in order

# Initial values and horizon are the same for every run, so set them once.
K0 = 1  # capital
L0 = 1  # labour
A0 = 1  # technology level
Y0 = ((A0*L0)**(1-alpha))*(K0**alpha)  # from the production function
Y_AL0 = Y0/(A0*L0)  # output per effective worker
T = 100  # number of years

# Run the same dynamics once per savings rate.  After the loop `s` holds the
# last rate in the list.
# NOTE: L and A are lists inside this block, not the scalar parameters
# defined earlier in the file.
for s in savings_rates:
    # paths of the main variables, each seeded with its initial value
    Time = [1901]   # year
    L = [L0]        # labour
    K = [K0]        # capital
    A = [A0]        # technology level
    Y = [Y0]        # output
    Y_AL = [Y_AL0]  # output per effective worker
    for i in range(T):
        L.append((1+n)*L[i])
        A.append((1+g)*A[i])
        K.append((s*Y[i]) - (d*K[i]) + K[i])
        # index i+1 is the entry appended just above: this year's output is
        # produced with this year's technology, labour and capital
        Y.append(((A[i+1]*L[i+1])**(1-alpha))*(K[i+1]**alpha))
        Y_AL.append(Y[i+1]/(A[i+1]*L[i+1]))
        Time.append(1+Time[i])
    # Y becomes very large over 100 years, so keep its natural log for plotting
    log_Y = [log(x) for x in Y]

    # store this run's paths; data_list[j] corresponds to savings_rates[j]
    data = pd.DataFrame({'Time': Time,'Y': Y, 'K': K,'L':L,'A':A, 'Y/AL':Y_AL,'log_Y':log_Y})
    data_list.append(data)


fig, ax = plt.subplots(3, 1, figsize=(14, 16))  # three panels stacked in one column

# data_list[j] is drawn with the legend text rate_labels[j]
rate_labels = ['20%', '30%', '35%', '40%', '45%']
# One entry per panel: (DataFrame column to draw, panel title)
panel_specs = [
    ('Y/AL', 'Production per effective worker function'),
    ('Y', 'Production'),
    ('log_Y', 'log Production'),
]
for panel, (column, heading) in zip(ax, panel_specs):
    for position, rate in enumerate(rate_labels):
        run = data_list[position]
        panel.plot(run['Time'], run[column], label=f'{column} at s={rate}')
    if column == 'Y':
        # only the level of output gets plain (non-scientific) tick labels
        panel.ticklabel_format(style='plain')
    panel.set_title(heading, fontweight="bold")
    panel.grid()
    panel.legend()

# Axis labels shared by all three panels
fig.supxlabel('Time')
fig.supylabel('Values')

plt.show()


# Location of the Excel workbook used for the empirical part
data_url = 'https://www.ssc.wisc.edu/~bhansen/econometrics/MRW1992.xlsx'


# Main DataFrame for the analysis, read straight from the URL
df = pd.read_excel(data_url)


df.head()  # first five observations


df.describe()  # summary statistics for the full sample


df.loc[df['N'] == 1].describe()  # rows flagged N == 1 (non-oil countries)


df.loc[df['I'] == 1].describe()  # rows flagged I == 1 (intermediate countries)


df.loc[df['O'] == 1].describe()  # rows flagged O == 1 (OECD countries)


# Bar chart of Y85 by country, sorted ascending, with the sample mean marked.
fig, ax = plt.subplots(figsize=(25,9))
ax.set_title('real GDP per working-age person in 1985, in dollars',fontweight="bold")
ranked = df.sort_values('Y85')  # sort once, reuse for labels and heights
ax.bar(ranked['country'], ranked['Y85'])
ax.xaxis.set_tick_params(rotation=90)  # vertical country names
ax.axhline(y=df['Y85'].mean(), color='r', label='mean Y85')  # horizontal line at the mean
ax.set_xlabel('Countries')
ax.set_ylabel('Value in dollars')
ax.legend()
ax.grid()
plt.show()


# Bar chart of pop_growth by country, sorted ascending, with the sample mean marked.
fig, ax = plt.subplots(figsize=(25,9))
ax.set_title('The yearly average growth rate (%) of the working-age population for 1960-1985',fontweight="bold")

ranked = df.sort_values('pop_growth')  # sort once, reuse for labels and heights
ax.bar(ranked['country'], ranked['pop_growth'])
ax.axhline(y=df['pop_growth'].mean(), color='r', label='mean pop_growth')  # horizontal line at the mean
ax.set_xlabel('Countries')
ax.set_ylabel('Value in %')
ax.legend()
ax.xaxis.set_tick_params(rotation=90)  # vertical country names
ax.grid()
plt.show()


# Bar chart of invest by country, sorted ascending, with the sample mean marked.
fig, ax = plt.subplots(figsize=(25,9))
ax.set_title('The share (%) of real investment (incl. government investment) in real GDP, averaged for 1960-1985',fontweight="bold")

ranked = df.sort_values('invest')  # sort once, reuse for labels and heights
ax.bar(ranked['country'], ranked['invest'])
ax.axhline(y=df['invest'].mean(), color='r', label='mean invest')  # horizontal line at the mean
ax.set_xlabel('Countries')
ax.set_ylabel('Value in %')
ax.legend()
ax.xaxis.set_tick_params(rotation=90)  # vertical country names
ax.grid()
plt.show()


# Scatter of Y85 against the investment share expressed as a fraction.
fig, ax = plt.subplots(figsize=(15,5))
ax.set_title('Real GDP 1985 vs Savings rate',fontweight="bold")

investment_share = df['invest']/100  # percent -> fraction
ax.scatter(investment_share, df['Y85'])
ax.set_xlabel('investment rate (proxy for savings rates)')
ax.set_ylabel('real GDP per working-age person in 1985, in dollars')
ax.xaxis.set_tick_params(rotation=90)
ax.grid()
plt.show()


df.head()


# Log-transformed variables for the regressions.  The percentage columns are
# divided by 100 first so that the logs are taken of fractions.

df['log_Y85'] = np.log(df['Y85'])
# MRW 1992 use the investment share as a proxy for the savings rate
df['log_s'] = np.log(df['invest'].div(100))
df['log_school'] = np.log(df['school'].div(100))
# (n + g + delta): population growth n plus 0.05, since MRW 1992 assume
# that g + delta is 0.05
df['log_ngd'] = np.log(df['pop_growth'].div(100).add(0.05))


# Unrestricted regressions, one per sample.  The flag columns select the rows:
# N == 1 non-oil (reg1), I == 1 intermediate (reg2), O == 1 OECD (reg3).
#
# Syntax of sm.ols:
# sm.ols("dependent variable ~ regressor 1 + regressor 2 + ...", data=dataframe).fit()
reg1, reg2, reg3 = (
    sm.ols("log_Y85 ~ log_s+ log_ngd", data=df[df[flag] == 1]).fit()
    for flag in ('N', 'I', 'O')
)


# Forcing the coefficients on log_s and log_ngd to have the same magnitude and
# opposite sign is equivalent to regressing on their difference, so that
# difference is built as a single regressor.
df['s_minus_ngd'] = df['log_s'].sub(df['log_ngd'])


# Restricted regressions, one per sample: N == 1 non-oil (reg1_restricted),
# I == 1 intermediate (reg2_restricted), O == 1 OECD (reg3_restricted).
reg1_restricted, reg2_restricted, reg3_restricted = (
    sm.ols("log_Y85 ~ s_minus_ngd", data=df[df[flag] == 1]).fit()
    for flag in ('N', 'I', 'O')
)


def _coef_at(result, position):
    """Return the fitted coefficient at integer ``position`` (0 = first)."""
    # result.params is a label-indexed pandas Series when the model is fitted
    # from a formula.  Indexing such a Series with a bare integer
    # (params[1]) is deprecated in pandas and fails on newer versions, so the
    # values are converted to a plain array and indexed by position instead.
    return np.asarray(result.params)[position]


# Extra rows for the unrestricted table: number of observations and the
# standard error of the estimate (square root of the result's `scale`).
info_dictu = {
    'N': lambda x: x.nobs,
    's.e.e.': lambda x: np.sqrt(x.scale),
}

# Extra rows for the restricted table: the two above plus the implied alpha.
# The slope (position 1, right after the intercept) equals alpha/(1-alpha);
# solving for alpha gives alpha = slope/(1 + slope).  Refer MRW 1992.
info_dictr = {
    'N': lambda x: x.nobs,
    's.e.e.': lambda x: np.sqrt(x.scale),
    'Implied α': lambda x: f"{_coef_at(x, 1)/(1 + _coef_at(x, 1)):.2f}",
}



# Arguments used below:
#   model_names      column headings
#   regressor_order  which regressors are printed first
#   info_dict        extra rows appended to the table
#   float_format     '%0.3f' prints results to three decimal places
# The unrestricted table uses info_dictu, which has no implied-alpha row.
results_unres = summary_col(
    results=[reg1, reg2, reg3],
    model_names=['Non-Oil', 'Intermediate', 'OECD'],
    regressor_order=['Intercept', 'log_s', 'log_ngd'],
    info_dict=info_dictu,
    float_format='%0.3f',
    stars=True,
)

results_res = summary_col(
    results=[reg1_restricted, reg2_restricted, reg3_restricted],
    model_names=['Non-Oil', 'Intermediate', 'OECD'],
    regressor_order=['Intercept', 's_minus_ngd'],
    info_dict=info_dictr,
    float_format='%0.3f',
    stars=True,
)


titled_tables = (
    (results_unres, 'Unrestricted Regressions'),
    (results_res, 'Restricted Regressions'),
)
for table, heading in titled_tables:
    table.add_title(heading)


print(results_unres)

print('\n')  # blank space between the two tables

print(results_res)

           Unrestricted Regressions
==============================================
                Non-Oil  Intermediate   OECD  
----------------------------------------------
Intercept      5.430***  5.346***     8.021***
               (1.584)   (1.543)      (2.518) 
log_s          1.424***  1.318***     0.500   
               (0.143)   (0.171)      (0.434) 
log_ngd        -1.990*** -2.017***    -0.742  
               (0.563)   (0.534)      (0.852) 
R-squared      0.601     0.599        0.106   
R-squared Adj. 0.592     0.588        0.012   
N              98.0000   75.0000      22.0000 
s.e.e.         0.6891    0.6106       0.3774  
==============================================
Standard errors in parentheses.
* p<.1, ** p<.05, ***p<.01


           Restricted Regressions
=============================================
               Non-Oil  Intermediate   OECD  
---------------------------------------------
Intercept      6.872*** 7.093***     8.624***
               (0.121)  (0.146)      (0.533) 
s_minus_ngd    1.488*** 1.431***     0.554   
               (0.125)  (0.139)      (0.365) 
R-squared      0.597    0.592        0.103   
R-squared Adj. 0.593    0.586        0.058   
N              98.0000  75.0000      22.0000 
s.e.e.         0.6885   0.6119       0.3684  
Implied α      0.60     0.59         0.36    
=============================================
Standard errors in parentheses.
* p<.1, ** p<.05, ***p<.01


# Bar chart of school by country, sorted ascending, with the sample mean marked.
fig, ax = plt.subplots(figsize=(25,9))
ax.set_title('Fraction invested in human capital',fontweight="bold")
ranked = df.sort_values('school')  # sort once, reuse for labels and heights
ax.bar(ranked['country'], ranked['school'])
ax.xaxis.set_tick_params(rotation=90)  # vertical country names
ax.axhline(y=df['school'].mean(), color='r', label='mean school')  # horizontal line at the mean
ax.set_xlabel('Countries')
ax.set_ylabel('Value in %')
ax.legend()
ax.grid()
plt.show()


# Unrestricted regressions with log_school added as a regressor, one per sample.

# non-oil countries (N == 1)
reg1_hc = sm.ols(formula="log_Y85 ~ log_s+ log_ngd + log_school", data=df.loc[df['N'] == 1]).fit()

# intermediate countries (I == 1)
reg2_hc = sm.ols(formula="log_Y85 ~ log_s+ log_ngd+ log_school", data=df.loc[df['I'] == 1]).fit()

# OECD countries (O == 1)
reg3_hc = sm.ols(formula="log_Y85 ~ log_s+ log_ngd+ log_school", data=df.loc[df['O'] == 1]).fit()


# Taking differences against log_ngd imposes the condition that the
# coefficients on (n+g+delta), s_h and s_k sum to 0.
df['school_minus_ngd'] = df['log_school'].sub(df['log_ngd'])


# Restricted regressions on the two differenced regressors, one per sample.

# non-oil countries (N == 1)
reg1_restricted_hc = sm.ols(formula="log_Y85 ~ s_minus_ngd + school_minus_ngd ", data=df.loc[df['N'] == 1]).fit()

# intermediate countries (I == 1)
reg2_restricted_hc = sm.ols(formula="log_Y85 ~ s_minus_ngd + school_minus_ngd", data=df.loc[df['I'] == 1]).fit()

# OECD countries (O == 1)
reg3_restricted_hc = sm.ols(formula="log_Y85 ~ s_minus_ngd + school_minus_ngd", data=df.loc[df['O'] == 1]).fit()


def _coef_at(result, position):
    """Return the fitted coefficient at integer ``position`` (0 = first)."""
    # result.params is a label-indexed pandas Series when the model is fitted
    # from a formula.  Indexing such a Series with a bare integer
    # (params[1]) is deprecated in pandas and fails on newer versions, so the
    # values are converted to a plain array and indexed by position instead.
    return np.asarray(result.params)[position]


def _implied_share(result, position):
    """Return coefficient ``position`` divided by 1 + coef[1] + coef[2], as text."""
    denominator = 1 + _coef_at(result, 1) + _coef_at(result, 2)
    return f"{_coef_at(result, position)/denominator:.3f}"


# Extra rows for the unrestricted table: number of observations and the
# standard error of the estimate (square root of the result's `scale`).
info_dictu = {
    'N': lambda x: x.nobs,
    's.e.e.': lambda x: np.sqrt(x.scale),
}

# Extra rows for the restricted table: the two above plus implied alpha and
# beta.  Position 1 is the coefficient of the 1st regressor and position 2
# that of the 2nd (position 0 is the intercept); each implied share is that
# coefficient divided by one plus the sum of both.
info_dictr = {
    'N': lambda x: x.nobs,
    's.e.e.': lambda x: np.sqrt(x.scale),
    'Implied α': lambda x: _implied_share(x, 1),
    'Implied β': lambda x: _implied_share(x, 2),
}

# Arguments used below:
#   model_names      column headings
#   regressor_order  which regressors are printed first
#   info_dict        extra rows appended to the table
#   float_format     '%0.3f' prints results to three decimal places
# The unrestricted table uses info_dictu, which has no implied alpha/beta rows.
results_unres = summary_col(
    results=[reg1_hc, reg2_hc, reg3_hc],
    model_names=['Non-Oil', 'Intermediate', 'OECD'],
    regressor_order=['Intercept', 'log_s', 'log_ngd', 'log_school'],
    info_dict=info_dictu,
    float_format='%0.3f',
    stars=True,
)

results_res = summary_col(
    results=[reg1_restricted_hc, reg2_restricted_hc, reg3_restricted_hc],
    model_names=['Non-Oil', 'Intermediate', 'OECD'],
    regressor_order=['Intercept', 's_minus_ngd', 'school_minus_ngd'],
    info_dict=info_dictr,
    float_format='%0.3f',
    stars=True,
)


titled_tables = (
    (results_res, 'Restricted Regressions'),
    (results_unres, 'Unrestricted Regressions'),
)
for table, heading in titled_tables:
    table.add_title(heading)
print(results_unres)
print('\n')  # blank space between the two tables
print(results_res)

           Unrestricted Regressions
==============================================
                Non-Oil  Intermediate   OECD  
----------------------------------------------
Intercept      6.844***  7.791***     8.637***
               (1.177)   (1.192)      (2.214) 
log_s          0.697***  0.700***     0.276   
               (0.133)   (0.151)      (0.389) 
log_ngd        -1.745*** -1.500***    -1.076  
               (0.416)   (0.403)      (0.756) 
log_school     0.654***  0.731***     0.768** 
               (0.073)   (0.095)      (0.293) 
R-squared      0.786     0.781        0.352   
R-squared Adj. 0.779     0.771        0.244   
N              98.0000   75.0000      22.0000 
s.e.e.         0.5077    0.4547       0.3300  
==============================================
Standard errors in parentheses.
* p<.1, ** p<.05, ***p<.01


            Restricted Regressions
===============================================
                 Non-Oil  Intermediate   OECD  
-----------------------------------------------
Intercept        7.853*** 7.966***     8.716***
                 (0.140)  (0.154)      (0.466) 
s_minus_ngd      0.738*** 0.709***     0.283   
                 (0.124)  (0.138)      (0.334) 
school_minus_ngd 0.657*** 0.733***     0.769** 
                 (0.073)  (0.093)      (0.284) 
R-squared        0.784    0.781        0.352   
R-squared Adj.   0.779    0.775        0.284   
N                98.0000  75.0000      22.0000 
s.e.e.           0.5070   0.4516       0.3212  
Implied α        0.308    0.290        0.138   
Implied β        0.274    0.300        0.375   
===============================================
Standard errors in parentheses.
* p<.1, ** p<.05, ***p<.01

	Time	Y	K	L	A	Y/AL
0	1901	1.000000	1.000000	1.000000	1.000000	1.000000
1	1902	1.147420	1.200000	1.020000	1.100000	1.022656
2	1903	1.311747	1.424226	1.040400	1.210000	1.041992
3	1904	1.495153	1.675327	1.061208	1.331000	1.058539
4	1905	1.700053	1.956341	1.082432	1.464100	1.072731
...	...	...	...	...	...	...
96	1997	73231.567838	98961.545216	6.692933	9412.343651	1.162476
97	1998	82165.820918	111034.861046	6.826792	10353.578016	1.162476
98	1999	92190.052827	124581.121217	6.963328	11388.935818	1.162476
99	2000	103437.240983	139780.024943	7.102594	12527.829400	1.162476
100	2001	116056.586050	156833.194744	7.244646	13780.612340	1.162476

	country	N	I	Y60	Y85	Y_growth	pop_growth	invest	school
0	Algeria	1	1	2485.0	4371.0	4.8	2.6	24.1	4.5
1	Angola	1	0	1588.0	1171.0	0.8	2.1	5.8	1.8
2	Benin	1	0	1116.0	1071.0	2.2	2.4	10.8	1.8
3	Botswana	1	1	959.0	3671.0	8.6	3.2	28.3	2.9
4	Burkina Faso	1	0	529.0	857.0	2.9	0.9	12.7	0.4

	N	I	O	Y60	Y85	Y_growth	pop_growth	invest	school
count	121.000000	121.000000	121.000000	116.000000	108.000000	117.000000	107.000000	121.000000	118.000000
mean	0.809917	0.619835	0.181818	3681.818966	5683.259259	4.094017	2.279439	18.157025	5.526271
std	0.393998	0.487446	0.387298	7492.877637	5688.670819	1.891464	0.998748	7.853310	3.532037
min	0.000000	0.000000	0.000000	383.000000	412.000000	-0.900000	0.300000	4.100000	0.400000
25%	1.000000	0.000000	0.000000	973.250000	1209.250000	2.800000	1.700000	12.000000	2.400000
50%	1.000000	1.000000	0.000000	1962.000000	3484.500000	3.900000	2.400000	17.700000	4.950000
75%	1.000000	1.000000	0.000000	4274.500000	7718.750000	5.300000	2.900000	24.100000	8.175000
max	1.000000	1.000000	1.000000	77881.000000	25635.000000	9.200000	6.800000	36.900000	12.100000

	N	I	O	Y60	Y85	Y_growth	pop_growth	invest	school
count	98.0	98.000000	98.000000	98.000000	98.000000	98.000000	98.000000	98.000000	98.000000
mean	1.0	0.765306	0.224490	2994.897959	5309.765306	3.994898	2.201020	17.672449	5.396939
std	0.0	0.425986	0.419391	2862.521970	5277.182620	1.859130	0.889862	7.918330	3.468992
min	1.0	0.000000	0.000000	383.000000	412.000000	-0.900000	0.300000	4.100000	0.400000
25%	1.0	1.000000	0.000000	963.750000	1174.750000	2.725000	1.700000	11.725000	2.400000
50%	1.0	1.000000	0.000000	1818.000000	3150.000000	3.800000	2.400000	17.100000	4.750000
75%	1.0	1.000000	0.000000	4113.250000	7015.000000	5.100000	2.875000	23.400000	8.000000
max	1.0	1.000000	1.000000	12362.000000	19723.000000	9.200000	4.300000	36.900000	11.900000

	N	I	O	Y60	Y85	Y_growth	pop_growth	invest	school
count	75.0	75.0	75.000000	75.000000	75.000000	75.000000	75.000000	75.000000	75.000000
mean	1.0	1.0	0.293333	3620.760000	6589.826667	4.381333	2.166667	19.350667	6.381333
std	0.0	0.0	0.458356	2999.976459	5410.907211	1.736235	0.975141	7.565951	3.233093
min	1.0	1.0	0.000000	383.000000	608.000000	0.900000	0.300000	5.400000	0.500000
25%	1.0	1.0	0.000000	1347.000000	2167.000000	3.250000	1.450000	13.250000	3.650000
50%	1.0	1.0	0.000000	2382.000000	4492.000000	4.100000	2.400000	19.500000	6.600000
75%	1.0	1.0	1.000000	5016.000000	11183.500000	5.450000	2.900000	24.700000	8.900000
max	1.0	1.0	1.000000	12362.000000	19723.000000	9.200000	4.300000	36.900000	11.900000

Mankiw Romer Weil (1992)

Introduction & motivation

Research Questions:

The Solow Model: derivation and simulation

Assumptions of the Solow model

Analytics of the Solow model

Dynamics of the Solow model

Sensitivity analysis of the Solow model

Empirical testing of the Solow Model

Econometric Specification, assumptions & preview of the answer

Data:

Variable definitions:

Regression Analysis

Results

Empirical testing of the augmented Solow model

Augmented Solow Model

Econometric Specification, assumptions & preview of the answer

Data and subsamples

Regression Analysis

Results

Conclusions and discussion:

References

	N	I	O	Y60	Y85	Y_growth	pop_growth	invest	school
count	22.0	22.0	22.0	22.000000	22.000000	22.000000	22.000000	22.000000	22.000000
mean	1.0	1.0	1.0	6731.090909	13131.454545	3.868182	1.009091	25.790909	9.086364
std	0.0	0.0	0.0	2803.653380	4012.491694	0.994454	0.605459	4.985972	2.080361
min	1.0	1.0	1.0	2257.000000	4444.000000	2.500000	0.300000	17.700000	4.800000
25%	1.0	1.0	1.0	4536.500000	11388.500000	3.225000	0.600000	22.700000	7.925000
50%	1.0	1.0	1.0	7424.500000	13594.000000	3.750000	0.750000	25.350000	9.100000
75%	1.0	1.0	1.0	8314.500000	15282.000000	4.275000	1.350000	28.950000	10.700000
max	1.0	1.0	1.0	12362.000000	19723.000000	6.800000	2.500000	36.900000	11.900000