The model in this assignment is summarized as follows:
Suppose $\xi\sim\text{Beta}(\gamma, \delta)$. The learning mechanism then works as follows:
If the agent invents, she will get the result of inventing, either success or failure. Based on the result, she will update her belief about her ability by updating her parameters $(\gamma, \delta)$ via Bayes' rule.
Statisticians have documented many cases in which the prior and posterior distributions belong to the same family after a Bayesian update; such a prior is called a conjugate prior for the likelihood function. In Miller (1984), both the conjugate prior and the likelihood are normal distributions. In this assignment, the conjugate prior is a beta distribution and the likelihood is a Bernoulli distribution.
The prior distribution of $\xi$ given parameters $(\gamma, \delta)$ is $$ g(\xi;\gamma,\delta)=\frac{\xi^{\gamma-1} (1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)} \text{ where } \text{B}(\gamma,\delta)=\int_{0}^{1} u^{\gamma-1}(1-u)^{\delta-1}du $$ and the likelihood of the outcome $x\in\{0,1\}$ given $\xi$ is $$ f(x\,|\,\xi)= \xi^{x} (1-\xi)^{1-x}. $$ The agent's posterior belief is derived by using Bayes' rule: $$ \begin{split} f(\xi|x)& =\frac{f(x|\xi)}{f(x)}g(\xi)=\frac{f(x|\xi)}{\int_{0}^{1}f(x|\xi)g(\xi)d\xi}g(\xi)= \frac{\xi^{x}(1-\xi)^{1-x}}{\int_{0}^{1}\xi^{x}(1-\xi)^{1-x}\frac{{\xi}^{\gamma-1}(1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)}d\xi}\frac{\xi^{\gamma-1}(1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)}\\ & = \frac{\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}}{\int_{0}^{1}\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}d\xi}= \frac{\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}}{\text{B}(\gamma+x,\delta+(1-x))} \end{split} $$ Therefore, the agent's updated belief about her ability follows a beta distribution with parameters $(\gamma+x,\delta+(1-x))$.
The updated expected payoff is then: $$ \mathbb{E}[\mathbf{1}\{x'=1\}|\gamma',\delta'] = \frac{\gamma'}{\gamma' + \delta'} = \begin{cases} \frac{\gamma}{\gamma + (\delta+1)} & \text{ if } x=0\\ \frac{\gamma+1}{(\gamma+1) + \delta} & \text{ if } x=1 \end{cases} $$ If the agent chooses not to invent, then there will be no update on her parameters (there is no information to update the parameters). Thus, the agent's belief about her ability in the next period will still be $\xi \sim \text{Beta}(\gamma, \delta)$; i.e., the agent solves the same recursive problem in the next period with the same parameters.
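To make the updating rule concrete, here is a minimal Julia sketch (the helper names update_belief and expected_success are mine, not part of the assignment code):
using Distributions, Statistics
# Posterior update of a Beta(γ, δ) belief after observing a Bernoulli outcome x ∈ {0,1}:
# a success (x = 1) increments γ, a failure (x = 0) increments δ.
update_belief(γ, δ, x) = (γ + x, δ + (1 - x))
# Expected probability of success under a Beta(γ, δ) belief.
expected_success(γ, δ) = γ / (γ + δ)
γ₁, δ₁ = update_belief(3.0, 1.0, 1)   # after a success: Beta(4, 1)
γ₀, δ₀ = update_belief(3.0, 1.0, 0)   # after a failure: Beta(3, 2)
expected_success(3.0, 1.0), expected_success(γ₁, δ₁), expected_success(γ₀, δ₀)  # 0.75, 0.8, 0.6
mean(Beta(γ₁, δ₁)) ≈ expected_success(γ₁, δ₁)   # true: the same posterior mean via Distributions.jl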
Let's start with a simple setting: a static model. In this case the lifetime utility is $$d_t\mathbf{1} \{x_t=1\} + (1-d_t)w.$$
If we knew the exact value of $\xi$, then the decision rule is simple: we choose to invent if the expected payoff of invention is larger than the payoff of the outside option given $\xi$: $$ \mathbb{E}_{x}\big[1\cdot\mathbf{1}\{x=1\}+0\cdot\mathbf{1}\{x=0\}|\xi]=1\cdot\mathbb{P}(x=1|\xi) + 0\cdot\mathbb{P}(x=0|\xi) = \xi. $$ In this case, the decision rule would be: $$d_t=\begin{cases} 1 &\text{ if } \xi>w \\ 0 &\text{ otherwise } \end{cases}$$
However, the agent only knows that her ability $\xi$ is a random draw from a beta distribution $\text{Beta}(\gamma,\delta)$, not its exact value. Being risk neutral, she computes her expected return from inventing and decides whether it is worth trying: $$ \mathbb{E}_{\xi} \Big[\mathbb{E}_{x} \big[ \mathbf{1}\{x=1\} \big| \xi \big] \Big|\gamma,\delta\Big] =\mathbb{E}_{\xi} \big[1 \cdot \mathbb{P}(x=1|\xi) + 0 \cdot \mathbb{P}(x=0|\xi) \big| \gamma,\delta \big] =\mathbb{E}_{\xi} [1 \cdot \xi + 0 \cdot (1-\xi) | \gamma,\delta] = \mathbb{E}_{\xi}[{\xi}|\gamma,\delta]=\frac{\gamma}{\gamma+\delta}. $$ The decision rule is then: $$ d_t=\begin{cases} 1 &\text{ if } \frac{\gamma}{\gamma+\delta}>w \\ 0 &\text{ otherwise } \end{cases} $$
Let's make simulated data of $N$ agents with this decision rule!
# For REPL setting
ENV["LINES"] = 1000; ENV["COLUMNS"] = 250;
## In Julia, you can activate virtual environment you compiled in REPL
using Pkg; Pkg.activate("./")
using Distributed;
addprocs(7; exeflags=`--project=$(Base.active_project())`); # choose "the number of CPU's -1"
@everywhere begin
using SharedArrays, LinearAlgebra, Optim, ForwardDiff, NLSolversBase, Ipopt, Zygote,
DataFrames, Printf, Random, Distributions, Statistics, HypothesisTests, TimeSeries,
Distances, Plots, LaTeXStrings, PlotThemes, .MathConstants; # .MathConstants for γ=0.5772...
end
#=
Distributed.jl is used for parallelization
@everywhere is a macro that tells all the processors to run the commands that follow
@distributed is a macro that tells the processors to share the work in a loop
SharedArray{T} is an array type that multiple processors can access
@sync is a macro that makes the processors run the loop in a synchronized manner
=#
Random.seed!(42) # random number generator for replicability
function simulation_static(γ, δ, w, N)
γData = zeros(N);
δData = zeros(N);
dData = zeros(N);
xData = zeros(N);
function d_static(γ,δ,w)
# Decision rule in a static case
if γ/(γ+δ)>w
return 1
else
return 0
end
end;
# Flip a coin for each agent 'i' whose probability of success is ξ[i].
# We record the result of inventing in xData. 0 in this case means either:
# i) the agent tried inventing and failed, or
# ii) the agent did not try inventing. We need to look at dData to see why we observe 0 here.
# '.' broadcasts operations element-wise.
# Read https://julia.quantecon.org/getting_started_julia/julia_by_example.html for details.
γData .= γ;
δData .= δ;
dData = d_static.(γData,δData,w);
ξ = rand(Beta(γ,δ),N) # Draw a random number ξ ~ Beta(γ,δ) N-times.
xData = rand.(Bernoulli.(ξ)) .* dData;
@printf("γ=%4.2f, δ=%4.2f, w=%4.2f", γ, δ, w);
@printf(", N=%4.0f, d=1: %5.0f, x=1: %5.0f \n", N,sum(dData),sum(xData))
end
simulation_static(3.0,1.0,0.65,10_000)
simulation_static(3.0,1.0,0.85,10_000)
γ=3.00, δ=1.00, w=0.65, N=10000, d=1: 10000, x=1:  7432 
γ=3.00, δ=1.00, w=0.85, N=10000, d=1:     0, x=1:     0 
By now, you might have noticed that in the static case, everyone makes the same choice! This is because in the first period everyone holds the same belief about their ability: with $\gamma=3$ and $\delta=1$ the prior mean is $\frac{\gamma}{\gamma+\delta}=0.75$, so everyone invents when $w=0.65$ and no one does when $w=0.85$. As agents try inventing and learn more about their ability, we will see people making different choices.
Given data where everyone makes the same choice (i.e., all zeros or all ones), we cannot point-identify any of the parameters $(\gamma,\delta,w)$. Let's take a step back and look at the decision rule: $$ d_t=\begin{cases} 1 &\text{ if } \frac{\gamma}{\gamma+\delta}>w \\ 0 &\text{ otherwise } \end{cases} $$
Let's solve the two-period model. The lifetime utility is now $\sum_{t=1}^{2} \beta^{t-1} [d_t\mathbf{1} \{x_t=1\} + (1-d_t)w]$. The state variables in each period are $(\gamma_t,\delta_t,w,t,\beta)$.
Let's solve this model by backward induction. At $t=2$, the agent observes $(\gamma_{2},\delta_{2},w,2,\beta)$ and solves $$ \underset{d_{2}\in\{0,1\}}{\max}\;\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[d_2\mathbf{1} \{x_2=1\} + (1-d_2)w\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big]. $$ It is straightforward that at $t=2$, the agent will choose to invent whenever the expected payoff of inventing is higher than choosing the outside option. We also derived that $\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[\mathbf{1}\{x_{2}=1\}\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big] = \frac{\gamma_2}{\gamma_2 + \delta_2}$. Thus, the decision rule at $t=2$ becomes: $$\begin{align*} d_{2}(\gamma_2,\delta_2,w)=\begin{cases} 1 & \text{if } \frac{\gamma_2}{\gamma_2 + \delta_2}> w\\ 0 & \text{if } \frac{\gamma_2}{\gamma_2 + \delta_2}\leq w \end{cases} = \mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}. \end{align*}$$
Plugging the decision rule into the maximization problem, the expected value function at $t=2$ becomes: $$\begin{align*} V(\gamma_2,\delta_2,w,2,\beta) &= \underset{d_{2}\in\{0,1\}}{\max}\;\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[d_2\mathbf{1} \{x_2=1\} + (1-d_2)w\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big] \\ &= d_2(\gamma_2,\delta_2,w)\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[\mathbf{1}\{x_{2}=1\}\big|\xi_2 \big]\Big|\gamma_2,\delta_2\Big] + (1-d_2(\gamma_2,\delta_2,w))w \\ &= d_2(\gamma_2,\delta_2,w)\frac{\gamma_2}{\gamma_2+\delta_2} + (1-d_2(\gamma_2,\delta_2,w))w \\ &= \mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\} \frac{\gamma_2}{\gamma_2+\delta_2} + \left(1-\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\right) w \end{align*}$$
Knowing the decision rule $d_{2}(\gamma_2,\delta_2,w)$, we can solve for the agent's choice at $t=1$. At $t=1$, the agent maximizes her expectation of the discounted present value of the lifetime payoff: $$ \begin{align*} V(\gamma_1,\delta_1,w,1,\beta) = \underset{d_{1}\in\{0,1\}}{\max}\; \mathbb{E}_{\xi_1}\Big[&\mathbb{E}_{x_1}\big[d_1\mathbf{1}\{x_{1}=1\}+(1-d_{1})w\big|\xi_1\big]\Big|\gamma_1,\delta_1\Big] \\ +\beta \Bigg(&d_1\mathbb{E}_{\xi_1}\Big[\mathbb{E}_{x_1}\Big[\mathbf{1}\{x_1=0\}V(\gamma_2,\delta_2,w,2)\Big|\xi_1\Big]\Big|\gamma_1,\delta_1\Big]+\\ &d_1\mathbb{E}_{\xi_1}\Big[\mathbb{E}_{x_1}\Big[\mathbf{1}\{x_1=1\}V(\gamma_2,\delta_2,w,2)\Big|\xi_1\Big]\Big|\gamma_1,\delta_1\Big]+\\ &(1-d_1)V(\gamma_2,\delta_2,w,2)\Bigg) \end{align*} $$ where $(\gamma_2,\delta_2)$ are updated by the following rule: $$ \begin{align*} (\gamma_2,\delta_2) = \begin{cases} (\gamma_1+1, \delta_1) &\text{if } d_1=1, x_1 =1\\ (\gamma_1, \delta_1+1) &\text{if } d_1=1, x_1 =0 \\ (\gamma_1, \delta_1) &\text{if } d_1=0 \end{cases}. \end{align*} $$
Noting that $\mathbb{E}_{\xi_1}[\mathbb{P}[x_1=1|\xi_1]\big|\gamma,\delta]=\frac{\gamma}{\gamma+\delta}$ and $\mathbb{E}_{\xi_1}[\mathbb{P}[x_1=0|\xi_1]\big|\gamma,\delta]=\frac{\delta}{\gamma+\delta}$, we rewrite the value function as: $$ \begin{equation*} \begin{split} V(\gamma,\delta,w,1,\beta) = \underset{d_{1}}{\max}\; d_{1}\frac{\gamma}{\gamma+\delta}+(1-d_{1})w +\beta \left[d_1\frac{\gamma}{\gamma+\delta}V(\gamma+1,\delta,w,2)+d_1\frac{\delta}{\gamma+\delta}V(\gamma,\delta+1,w,2)+(1-d_1)V(\gamma,\delta,w,2)\right] \end{split} \end{equation*} $$
Finally, we use $V(\gamma_2,\delta_2,w,2,\beta)=\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\cdot \frac{\gamma_2}{\gamma_2+\delta_2} + \left(1-\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\right)\cdot w$ to find the expression for $V(\gamma,\delta,w,1,\beta)$ in terms of only $\gamma,\delta,w,\beta$, and $d_1$: $$ \begin{align*} V(\gamma,\delta,w,1,\beta) = \max_{d_{1}} \; d_{1}\frac{\gamma}{\gamma+\delta}+(1-d_{1})w + \beta\bigg[&d_1\frac{\gamma}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\} \frac{\gamma+1}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\} w\right)+\\ &d_1\frac{\delta}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}>w\right\} \frac{\gamma}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\} w\right)+\\ &(1-d_1)\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\} \frac{\gamma}{\gamma+\delta} + \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}\leq w\right\} w\right)\bigg] \end{align*} $$
Side note: we could write it this way only because we had two periods. If you have more than two periods, you may want to prepare a mapping from the state space to the decision for each period. In this case, storing a policy function $d_t=d(\gamma,\delta,w,t)$ on a discretized state space for each time period $t$ may be necessary. If you have an infinite horizon, the time dimension goes away and you may only need to find $d = d(\gamma,\delta,w)$, which we shall see later.
Can you find $w^*$, the upper bound of $w$, that ensures for every $w<w^*$, everyone invents in the first period? From the optimization problem in the first period, $d_1=1$ if the value of the value function when choosing $d_1=1$ is larger than or equal to that when choosing $d_1=0$: $$ \begin{aligned} \frac{\gamma}{\gamma+\delta}+\beta\bigg[ &\frac{\gamma}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\} \frac{\gamma+1}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\} w\right)+ \\ &\frac{\delta}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\} \frac{\gamma}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\} w\right)\bigg] \\ &\geq w+\beta\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\} \frac{\gamma}{\gamma+\delta} + \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}\leq w\right\} w\right) \end{aligned} $$
$w$ is compared to three quantities, $\frac{\gamma}{\gamma+\delta}$, $\frac{\gamma+1}{\gamma+\delta+1}$, and $\frac{\gamma}{\gamma+\delta+1}$, inside the indicator functions. It is clear that $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$. Thus, we have four cases to consider:
$w<\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$ The following shows the values for indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=0 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}+\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\bigg] &\geq w+\beta\bigg[\frac{\gamma}{\gamma+\delta}\bigg]\\ \frac{\gamma}{\gamma+\delta}&\geq w \end{align*} $$ (The $\beta$ terms cancel because $\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}+\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}=\frac{\gamma(\gamma+\delta+1)}{(\gamma+\delta)(\gamma+\delta+1)}=\frac{\gamma}{\gamma+\delta}$.) Thus, if $w<\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}$, everyone will choose to invent.
$\frac{\gamma}{\gamma+\delta+1}\leq w<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$ The following show the values for indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=0 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}+\frac{\delta}{\gamma+\delta}w\bigg]&\geq w+\beta\bigg[\frac{\gamma}{\gamma+\delta}\bigg]\\ \frac{\gamma}{\gamma+\delta}\frac{1-\frac{\beta\delta}{\gamma+\delta+1}}{1-\frac{\beta\delta}{\gamma+\delta}}&\geq w \end{align*} $$ Thus, everyone will choose to invent if $\frac{\gamma}{\gamma+\delta+1}\leq w<\min\{\frac{\gamma}{\gamma+\delta},\frac{\gamma}{\gamma+\delta}\frac{1-\frac{\beta\delta}{\gamma+\delta+1}}{1-\frac{\beta\delta}{\gamma+\delta}}\}=\frac{\gamma}{\gamma+\delta}$
$\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}\leq w<\frac{\gamma+1}{\gamma+\delta+1}$ The following show the values for indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=1 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[ \frac{\gamma}{\gamma+\delta} \frac{\gamma+1}{\gamma+\delta+1} +\frac{\delta}{\gamma+\delta} w \bigg] &\geq w+\beta w \\ \frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}&\geq w \end{align*} $$ Thus, everyone will choose to invent if $\frac{\gamma}{\gamma+\delta}\leq w<\min\{\frac{\gamma+1}{\gamma+\delta+1},\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}\}=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$
$\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}\leq w$ The following show the values for indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=1 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}w + \frac{\delta}{\gamma+\delta} w \bigg] &\geq w+\beta w \\ \frac{\gamma}{\gamma+\delta} &\geq w \end{align*} $$ This is a contradiction: in this case $w\geq\frac{\gamma+1}{\gamma+\delta+1}>\frac{\gamma}{\gamma+\delta}$, so $\frac{\gamma}{\gamma+\delta}\geq w$ cannot hold. Thus, there is no $w$ with $\frac{\gamma+1}{\gamma+\delta+1}\leq w$ that makes everyone choose $d_1=1$.
To sum up, everyone will choose to invent at $t=1$ if $w<\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}=w^*$.
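For later reference, this threshold is easy to wrap in a one-line helper (the name w_star is mine; the same expression is evaluated again as w⃰ when we validate the two-period code below):
# Upper bound on w below which everyone invents at t = 1 in the two-period model.
w_star(γ, δ, β) = (γ / (γ + δ)) * (1 + β * (γ + 1) / (γ + δ + 1)) / (1 + β * γ / (γ + δ))
w_star(2.3, 2.0, 0.96)   # ≈ 0.5647, matching the value of w⃰ computed below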
Let's code what we discussed so far. Instead of writing a bunch of indicator functions, I want to be lazy here and have the program find the decision rule for the maximization problem on its own via backward induction. This is convenient because it allows us to easily extend the program to a finite-horizon model of any length $T$.
We start from the last period, $t=2$. In this period, we do not have any continuation value to think about; the maximization problem only has today's per-period utility. The value function and the policy function here are straightforward: $$ \begin{aligned} V(\gamma,\delta,w,2,\beta) &= \underset{d\in\{0,1\}}{\max} \quad\; d \frac{\gamma}{\gamma+\delta}+ (1-d) w\\ d(\gamma,\delta,w,2,\beta) &= \underset{d\in\{0,1\}}{\arg\max} \; d \frac{\gamma}{\gamma+\delta}+ (1-d) w\\ \end{aligned} $$ The policy function and the value function at $t=1$ simply take the value function and the policy function we found at $t=2$ and return the solution and the maximized value to the maximization problem: $$ \begin{aligned} V(\gamma,\delta,w,1,\beta) = \underset{d\in\{0,1\}}{\max} &d \frac{\gamma}{\gamma+\delta}+ (1-d) w + \beta \Bigg(d\left(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \right) + (1-d) V(\gamma,\delta,w,2,\beta)\Bigg) \\ d(\gamma,\delta,w,1,\beta) = \underset{d\in\{0,1\}}{\arg\max} &d \frac{\gamma}{\gamma+\delta}+ (1-d) w + \beta \Bigg(d\left(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \right) + (1-d) V(\gamma,\delta,w,2,\beta)\Bigg) \\ \end{aligned} $$
Side note: you can "solve and take note of" the solution to the model by telling the program to return the decision at $t$ given state variables $(\gamma,\delta,w,\beta)$ and storing the results in a DataFrame or in an Array (memoization) while doing backward induction. I will not do that here because the computation is cheap in our case; you may want to do it when the state space or time horizon becomes large, as sketched below.
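As a rough illustration of what such memoization could look like, here is a sketch under my own naming (solve_backward is not used anywhere below) that fills per-period value and policy arrays on a discretized $(\gamma,\delta)$ grid during backward induction for a $T$-period version of the model:
# Sketch: memoize the value and policy over a discretized (γ, δ) grid, one slice per period.
function solve_backward(γ₀, δ₀, w, β, T)
    γ_grid = γ₀:1.0:(γ₀ + T)              # beliefs reachable with at most T successes
    δ_grid = δ₀:1.0:(δ₀ + T)              # beliefs reachable with at most T failures
    nγ, nδ = length(γ_grid), length(δ_grid)
    V = zeros(nγ, nδ, T + 1)              # V[:, :, T+1] = 0: no continuation value after T
    d = zeros(Int, nγ, nδ, T)             # memoized policy, one slice per period
    for t in T:-1:1, (i, γ) in enumerate(γ_grid), (j, δ) in enumerate(δ_grid)
        p = γ / (γ + δ)
        Vs = V[min(i + 1, nγ), j, t + 1]  # continuation value after a success
        Vf = V[i, min(j + 1, nδ), t + 1]  # continuation value after a failure
        v1 = p + β * (p * Vs + (1 - p) * Vf)   # invent today
        v0 = w + β * V[i, j, t + 1]            # take the outside option today
        d[i, j, t] = v1 > v0 ? 1 : 0
        V[i, j, t] = max(v0, v1)
    end
    return V, d
end
# d[1, 1, 1] would be the first-period decision at the initial belief (γ₀, δ₀).
With the per-period policy stored, simulating data only requires array lookups rather than re-solving the recursion at each state, which is essentially what the infinite-horizon code later in this note does with its policy matrix d.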
Generating data based on this decision is also simple.
function u(j,γ,δ,w)
# Per-period utility function
return j * γ/(γ+δ) + (1-j) * w
end
function Val_2(γ,δ,w,t,β)
# The value function for the two-period model
# findmax(itr)[1] returns the maximum value
if t==2
return findmax([u(j,γ,δ,w) for j=0:1])[1]
else
return findmax([u(j,γ,δ,w) + β*(j*(γ/(γ+δ) * Val_2(γ+1,δ,w,t+1,β) + δ/(γ+δ) * Val_2(γ,δ+1,w,t+1,β))+
(1-j)*Val_2(γ,δ,w,t+1,β)) for j=0:1])[1]
end
end
function d_dyn_2(γ,δ,w,t,β)
# The policy function for the two-period model
# findmax(itr)[2] is the argmax. "-1" maps Julia's index (1,2) to our choice index (0,1)
if t==2
return findmax([u(j,γ,δ,w) for j=0:1])[2]-1
else
return findmax([u(j,γ,δ,w) + β*(j*(γ/(γ+δ) * Val_2(γ+1,δ,w,t+1,β) + δ/(γ+δ) * Val_2(γ,δ+1,w,t+1,β))+
(1-j)*Val_2(γ,δ,w,t+1,β)) for j=0:1])[2]-1
end
end
function simul_data(N,T,γ,δ,w,β)
# Data storage
γData = zeros(N,T);
δData = zeros(N,T);
dData = zeros(N,T);
xData = zeros(N,T);
#=
Again, everyone has different ξ, but each person retains ξ over time (i.e., no learning by doing).
We only get to know 'how good we are' as we invent and observe outcomes.
=#
γData[:,1] .= γ;
δData[:,1] .= δ;
ξ = rand(Beta(γ,δ),N);
#=
broadcast() takes the function d_dyn_2 (which expects 5 scalar arguments) and
applies it element-wise over the vectors γData[:,1] and δData[:,1]
while fixing w,1,β as scalars.
=#
dData[:,1] = broadcast(d_dyn_2,γData[:,1],δData[:,1],w,1,β);
xData[:,1] = rand.(Bernoulli.(ξ)) .* dData[:,1];
for t=2:T
γData[:,t] .= γData[:,t-1] + dData[:,t-1] .* (1 .* xData[:,t-1])
δData[:,t] .= δData[:,t-1] + dData[:,t-1] .* (1 .* (1 .- xData[:,t-1]))
dData[:,t] .= broadcast(d_dyn_2,γData[:,t],δData[:,t],w,t,β)
xData[:,t] .= rand.(Bernoulli.(ξ)) .* dData[:,t];
end
return γData, δData, dData, xData, ξ
end;
We can use $w^*=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$ and the choice-specific conditional value functions to check whether our program is correct. A choice-specific conditional value function is the discounted present value of lifetime utility when an agent commits to a certain choice today and behaves optimally in the periods that follow. In our case, there are two choice-specific conditional value functions at $t=1$: $$ \begin{align*} v_0(\gamma,\delta,w,1,\beta) &= w + \beta V(\gamma,\delta,w,2,\beta) \\ v_1(\gamma,\delta,w,1,\beta) &= \frac{\gamma}{\gamma+\delta}+ \beta \Bigg(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \Bigg) \end{align*} $$ We can plug $w^*=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$ into our choice-specific conditional value functions and check that they take the same value, which is precisely what the definition of $w^*$ requires.
γ=2.3; δ=2.0; β=0.96;
w⃰ = (γ/(γ+δ))*(1+β*(γ+1)/(γ+δ+1))/(1+β*γ/(γ+δ))
cvf= [(u(j,γ,δ,w⃰) + β*(j*(γ/(γ+δ) * Val_2(γ+1,δ,w⃰,2,β) + δ/(γ+δ) * Val_2(γ,δ+1,w⃰,2,β))+(1-j)*Val_2(γ,δ,w⃰,2,β))) for j=0:1];
# Print CVF when w=w⃰
print("w⃰: ",w⃰,"\n")
print("Choice-specific Conditional Value Function at t=1 when γ=$γ, δ=$δ, β=$β, w=w⃰ \n")
@printf(" - v₀(γ,δ,w⃰,1,β) = %1.12f \n",cvf[1])
@printf(" - v₁(γ,δ,w⃰,1,β) = %1.12f",cvf[2])
w⃰: 0.5646577217010124
Choice-specific Conditional Value Function at t=1 when γ=2.3, δ=2.0, β=0.96, w=w⃰ 
 - v₀(γ,δ,w⃰,1,β) = 1.106729134534 
 - v₁(γ,δ,w⃰,1,β) = 1.106729134534
Let's suppose we only observe the agent's choice at $t = 2$. From the data, we can only talk about the fraction of agents who quit inventing at $t=2$ conditional on having tried inventing at $t=1$. Theoretically, we can think of the following cases: $$ \begin{align*} \mathbb{P}(d_2=0|d_1=1)=\begin{cases} 0 &\text{ if } w<w^* \text{ and } w<\frac{\gamma}{\gamma+\delta+1} \\ \alpha &\text{ if } w<w^* \text{ and } \frac{\gamma}{\gamma+\delta+1}<w \text{ where } \alpha\in(0,1) \\ 1 &\text{ if } w<w^* \text{ and } w>\frac{\gamma+1}{\gamma+\delta+1} \end{cases} \end{align*} $$
We can easily show that the third case is impossible, since $w^*<\frac{\gamma+1}{\gamma+\delta+1}$. Thus, only the first two cases can occur.
Identifying $\gamma$ or $\delta$ is more interesting, so let's focus on identifying and estimating $\gamma$ via MLE. Let's suppose we are given $(\delta,w,\beta,\{d_{2i}\}_{i=1}^N)$ and are asked to identify and estimate $\gamma$. From the model, we know: $$ d_{2i}=\mathbf{1} \bigg\{ \mathbb{E}_{\xi_2}\bigg[\mathbb{E}_{x_2}\big[ \mathbf{1}\{x_2=1\}\big|\xi_2\big]\Big|\gamma,\delta,x_1 \bigg] > w \bigg\} $$ i.e., $d_2$ is chosen by comparing the expected payoff of inventing which depends on our updated belief to the payoff of the outside option. The probability of observing $d_{2i}=1$, $\mathbb{E}[\mathbf{1}[d_{2i}=1]]$, is then: $$ \begin{align*} \mathbb{E} \left[\mathbf{1}[d_{2i}=1]\right] =& \mathbb{E} \Bigg[\mathbf{1} \bigg\{ \mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[ \mathbf{1}\{x_2=1\}\big|\xi_2\big]\Big|\gamma,\delta,x_1 \Big] > w \bigg\}\Bigg] = \mathbb{E} \bigg[ \mathbf{1} \Big\{ \mathbb{E}_{\xi_2}\big[ 1\cdot\xi_{2}+0\cdot(1-\xi_{2})\big|\gamma,\delta,x_1 \big] > w \Big\} \bigg] = \mathbb{P} \Big[ \mathbb{E}_{\xi_2} \big[\xi_{2};\gamma,\delta\big] > w \Big]\\ =& \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=1, x_1=1 \Big] \cdot \mathbb{P} \Big[ d_{1}=1, x_1=1 \Big] + \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=1, x_1=0 \Big] \cdot \mathbb{P} \Big[ d_{1}=1, x_1=0 \Big] \\ +& \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=0 \Big] \cdot \mathbb{P} \Big[ d_{1}=0 \Big] \end{align*} $$
We saw that $w<w^{*} \implies d_1=1$. Since we are considering a dataset in which every agent is guaranteed to invent in the first period, we have $\mathbb{P}[d_1=0]=0.$ Thus, the following holds: $$ \begin{align*} \mathbb{E} \left[\mathbf{1}[d_{2i}=1]\right] = &\mathbb{P} \Big[ \mathbb{E}_{\xi_2} \big[ \xi_{2}; \gamma,\delta,x_1 \big] \geq w \bigm| d_{1}=1, x_1=1 \Big] \cdot \mathbb{P} \Big[d_{1}=1, x_1=1 \Big]+ \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] \geq w \bigm| d_{1}=1, x_1=0 \Big] \cdot \mathbb{P} \Big[d_{1}=1, x_1=0 \Big]\\ = &\mathbb{P} \bigg[ \frac{\gamma+1}{\gamma+\delta+1} \geq w \bigg] \cdot \frac{\gamma}{\gamma+\delta} + \mathbb{P} \bigg[ \frac{\gamma}{\gamma+\delta+1} \geq w \bigg] \cdot \frac{\delta}{\gamma+\delta} = \frac{\gamma}{\gamma+\delta} \quad \because w<w^*<\frac{\gamma+1}{\gamma+\delta+1} \text{ and } \frac{\gamma}{\gamma+\delta+1}<w. \end{align*} $$
In words, we know that the agent would choose to invent in the second period if invention was successful in the first period. We also know that the probability of success follows a beta distribution $\text{Beta}(\gamma,\delta)$ with expected value $\frac{\gamma}{\gamma+\delta}$. Thus, the likelihood of observing an agent inventing in the second period given $(\gamma,\delta)$ is $\frac{\gamma}{\gamma+\delta}$.
The flip side of this argument is the hazard rate at $t=2$: the probability of an agent choosing to quit in the second period is $\frac{\delta}{\gamma+\delta}$. I suggest you apply the same reasoning as above and convince yourself that the hazard rate is indeed $\frac{\delta}{\gamma+\delta}$.
The discussion above motivates constructing the likelihood of $\{d_{i2}\}_{i=1}^{N}$ as: $$ \begin{align*} \mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)=\prod_{i=1}^{N}\left(\frac{\gamma}{\gamma+\delta}\right)^{d_{i2}}\left(\frac{\delta}{\gamma+\delta}\right)^{1-d_{i2}} \end{align*} $$ The log-likelihood is $$ \begin{align*} \log\mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)&=\sum_{i=1}^{N}\left(d_{i2}\log\left(\frac{\gamma}{\gamma+\delta}\right)+(1-d_{i2})\log\left(\frac{\delta}{\gamma+\delta}\right)\right)\\ &=\sum_{i=1}^{N}\left(d_{i2}\left(\log\gamma-\log(\gamma+\delta)\right)+(1-d_{i2})\left(\log\delta-\log(\gamma+\delta)\right)\right) \end{align*} $$
Let's exploit that $\{d_{i2}\}_{i=1}^{N}$ are independent. The score function of a single observation $d_{i2}$ is $$ \begin{align*} s(\gamma;d_{i2},\delta)=\frac{\partial}{\partial\gamma}\log f(\gamma;d_{i2},\delta)=d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right) \end{align*} $$ This gives us the derivative of the log-likelihood with respect to $\gamma$: $$ \begin{align*} \frac{\partial}{\partial\gamma}\log \mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)=\sum_{i=1}^{N}\left(d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right)\right) \end{align*} $$
Setting the above to zero and solving for $\gamma$ gives us the MLE estimate of $\gamma$: $$ \begin{align*} \sum_{i=1}^{N}\left(d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right)\right) &= 0 \\ \left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)\sum_{i=1}^{N}d_{i2} -\frac{N}{\gamma+\delta} + \frac{1}{\gamma+\delta}\sum_{i=1}^{N}d_{i2}&= 0 \\ \frac{1}{\gamma}\sum_{i=1}^{N}d_{i2} = \frac{N}{\gamma+\delta}&\\ \therefore \hat{\gamma} = \frac{\delta\sum_{i=1}^{N}d_{i2}}{N-\sum_{i=1}^{N}d_{i2}}& \end{align*} $$
$\{d_{i2}\}_{i=1}^{N}$ are i.i.d. so I use the following theorem to compute the Fisher information: $$ \begin{align*} I_{N}(\gamma)&=N\cdot I(\gamma)=-N\cdot \mathbb{E}_{\gamma}\left(\frac{\partial^2\log f(\gamma;d_{i2},\delta)}{\partial \gamma^2}\right)\\ &=-N\cdot\mathbb{E}_{\gamma}\left( d_{i2}\left(-\frac{1}{\gamma^2}+\frac{1}{(\gamma+\delta)^2}\right)+(1-d_{i2})\left(\frac{1}{(\gamma+\delta)^2}\right)\right)\\ &=-N\cdot\left(\left(-\frac{1}{\gamma^2}+\frac{1}{(\gamma+\delta)^2}\right)\frac{\gamma}{\gamma+\delta}+\left(\frac{1}{(\gamma+\delta)^2}\right)\frac{\delta}{\gamma+\delta}\right) \\ &=\frac{N\delta}{\gamma(\gamma+\delta)^2} \end{align*} $$ Substituting $\gamma$ with $\hat{\gamma}$, we have asymptotic normality of the MLE as follows: $$ \begin{align*} &\hat{se} = \sqrt{1/I_N(\hat{\gamma})}\\ &\frac{\hat{\gamma}-\gamma}{\hat{se}} \xrightarrow{d} N(0,1) \end{align*} $$ Coding the likelihood and the estimation routine based on our derivation is straightforward:
function logLikelihood(γ,δ,dData)
γ = γ[1]
return -sum(dData[:,2].*(log(γ)-log(γ+δ)).+(1.0 .- dData[:,2]).*(log(δ)-log(γ+δ)))
end
function γ_estimation(δ,dData)
N = size(dData)[1]
γhat = (δ * sum(dData[:,2])) / (N-sum(dData[:,2]))
I_obs = δ / (γhat * (γhat+δ)^2) # per-observation Fisher information I(γ̂)
I_n = N * I_obs                 # total Fisher information I_N(γ̂)
se = sqrt(1 / I_n)
return γhat, se
end;
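As a quick aside, here is a minimal sketch of how the asymptotic-normality result can be used: simulate a two-period panel (with the same parameters as in the table below) and form a 95% confidence interval for γ. The variable names dData_ci, γhat_ci, and se_ci are mine.
# Simulate a two-period panel and build a 95% confidence interval for γ
# using the asymptotic standard error derived above.
_, _, dData_ci, _, _ = simul_data(10_000, 2, 3.0, 2.0, 0.55, 0.96);
γhat_ci, se_ci = γ_estimation(2.0, dData_ci)
(γhat_ci - 1.96 * se_ci, γhat_ci + 1.96 * se_ci)  # should cover the true γ = 3.0 roughly 95% of the time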
The code below shows the estimation results for various sample sizes. I also use Optim.jl, a Julia package for various optimization routines, to find the MLE. As you can see, Optim.jl returns an identical result, as it should. Since analytically solving for the MLE is no longer feasible as $T$ gets large in the finite-horizon case, or in the infinite-horizon case, we will use Optim.jl in the next section.
Random.seed!(42)
T=2;γ=3.0;δ=2.0;w=0.55;β=0.96;
N_vec = [50,500,10_000,100_000,500_000]
result_2 = Array{Float64}(zeros(length(N_vec),2,2))
h_rate_2 = Vector{Float64}(zeros(length(N_vec)))
_, _, dData, _, _ = simul_data(N_vec[end],T,γ,δ,w,β);
for i=1:length(N_vec)
N = N_vec[i]
h_rate_2[i] = sum((dData[1:N,1].==1).&(dData[1:N,2].==0))/sum((dData[1:N,1].==1))
result_2[i,1,1], result_2[i,1,2] = γ_estimation(δ,dData[1:N,:])
# We can also use Optim.jl to tell the program to find the MLE estimate for us
func = TwiceDifferentiable(x -> logLikelihood(x[1],δ,dData[1:N,:]),[1.0]);
optim = optimize(func,[1.0])
result_2[i,2,1] = optim.minimizer[1]
result_2[i,2,2] = sqrt(inv(Optim.hessian!(func,optim.minimizer)))[1]
end
# Print MLE estimation results
print("---------------- Estimating γ in a Two-Period Model -----------------\n")
print("Parameters: γ=$γ, δ=$δ, w=$w, β=$β, T=$T \n")
@printf("Hazard Rate: Data vs Theory \n")
print("=====================================================================\n")
@printf("N ||"); [@printf(" %7i |", i) for i in N_vec]; @printf("| Theory |\n")
@printf("h₂ ||"); [@printf(" %1.5f |", i) for i in h_rate_2[:]]; @printf("| %1.5f |\n",δ/(γ+δ))
print("=====================================================================\n")
@printf("Estimation Result for γ: \n")
print("=============================================================\n")
@printf("MLE \\ N ||"); [@printf(" %7i |", i) for i in N_vec]; @printf("\n")
print("-------------------------------------------------------------\n")
@printf("By hand ||"); [@printf(" %1.5f |", i) for i in result_2[:,1,1]]; @printf("\n")
@printf(" ||"); [@printf("(%1.5f)|", i) for i in result_2[:,1,2]]; @printf("\n")
print("-------------------------------------------------------------\n")
@printf("Optim.jl ||"); [@printf(" %1.5f |", i) for i in result_2[:,2,1]]; @printf("\n")
@printf(" ||"); [@printf("(%1.5f)|", i) for i in result_2[:,2,2]]; @printf("\n")
print("=============================================================\n")
@printf("Standard errors in parentheses.")
---------------- Estimating γ in a Two-Period Model -----------------
Parameters: γ=3.0, δ=2.0, w=0.55, β=0.96, T=2 
Hazard Rate: Data vs Theory 
=====================================================================
N  ||      50 |     500 |   10000 |  100000 |  500000 || Theory  |
h₂ || 0.34000 | 0.38800 | 0.40000 | 0.40192 | 0.40010 || 0.40000 |
=====================================================================
Estimation Result for γ: 
=============================================================
MLE \ N  ||      50 |     500 |   10000 |  100000 |  500000 |
-------------------------------------------------------------
By hand  || 3.88235 | 3.15464 | 3.00000 | 2.97611 | 2.99870 |
         ||(1.15904)|(0.28952)|(0.06124)|(0.01920)|(0.00866)|
-------------------------------------------------------------
Optim.jl || 3.88235 | 3.15464 | 3.00000 | 2.97611 | 2.99870 |
         ||(1.15904)|(0.28952)|(0.06124)|(0.01920)|(0.00866)|
=============================================================
Standard errors in parentheses.
Suppose now that individuals live forever. The lifetime utility is now $\sum_{t=1}^{\infty}\beta^{t-1}(d_t\mathbf{1} \{x_t=1\} + (1-d_t)w)$.
We consider the Bellman representation: $$ \begin{align*} V(\gamma,\delta,w,\beta)=\underset{d\in\{0,1\}}{\max}\; d \frac{\gamma}{\gamma+\delta} + (1-d)w + \beta \left(d\left(\frac{\gamma}{\gamma+\delta}V(\gamma+1,\delta,w,\beta)+\frac{\delta}{\gamma+\delta}V(\gamma,\delta+1,w,\beta)\right)+(1-d)V(\gamma,\delta,w,\beta)\right) \end{align*} $$ The following code shows value function iteration (VFI) and data simulation.
@everywhere function VFI(γ,δ,w,β,T;print_flag=1)
γ_vec = collect(γ:γ+T);
δ_vec = collect(δ:δ+T);
V = Matrix{Float64}( w/(1-β) .* ones(length(γ_vec),length(δ_vec)));
v₀ = Matrix{Float64}(zeros(length(γ_vec),length(δ_vec)));
v₁ = Matrix{Float64}(zeros(length(γ_vec),length(δ_vec)));
d = Matrix{Float64}(zeros(length(γ_vec),length(δ_vec)));
max_distance = 1.0
euc_distance = 1.0
num_iter = 0
tol = 1e-16
max_steps = 2000
while (max_distance>tol && euc_distance>tol && num_iter<=max_steps)
# initialization
V_next = Matrix{Float64}(zeros(length(γ_vec),length(δ_vec)));
for i = 1:length(γ_vec)
for j = 1:length(δ_vec)
# we clip the value function if we reach the boundary of the grid
if i+1 < length(γ_vec)
V_success = V[i+1,j]
else
V_success = V[i,j]
end
if j+1 < length(δ_vec)
V_fail = V[i,j+1]
else
V_fail = V[i,j]
end
# Probability of success and fail
P_success = γ_vec[i]/(γ_vec[i]+δ_vec[j])
P_fail = δ_vec[j]/(γ_vec[i]+δ_vec[j])
# Conditional value functions
v₀[i,j] = w + β * V[i,j]
v₁[i,j] = γ_vec[i]/(γ_vec[i]+δ_vec[j]) + β * (P_success * V_success + P_fail * V_fail)
end
end
V_next = max.(v₀, v₁)
d = (v₁.==V_next)
euc_distance = euclidean(V,V_next)
max_distance = maximum(abs.(V-V_next))
V = V_next
num_iter+=1
if (num_iter % 50==0) && (print_flag==1)
@printf("Step: %3i, Euclidean: %1.4e, Max: %1.4e \n",num_iter,euc_distance,max_distance)
end
end
if (num_iter<=max_steps) && (print_flag==1)
@printf("VFI complete. It took %3i iterations.",num_iter)
end
if (num_iter>max_steps) && (print_flag==1)
@printf("VFI not completed. Euclidean: %1.4e, Max: %1.4e \n",euc_distance,max_distance)
end
gr(fmt=png);
p1 = heatmap(δ_vec,γ_vec,d)
title!("Policy Function")
xlabel!(L"\delta")
ylabel!(L"\gamma")
p2 = heatmap(δ_vec,γ_vec,V)
title!("Value function")
xlabel!(L"\delta")
ylabel!(L"\gamma")
fig=plot(p1, p2, label=["" ""],size=(1200,500))
return v₀, v₁, V, d, fig
end
@everywhere function simul_data_infty(N,T,γ,δ,d)
γData = Array{Float64}(zeros(N,T));
δData = Array{Float64}(zeros(N,T));
dData = Array{Float64}(zeros(N,T));
xData = Array{Float64}(zeros(N,T));
ξ = rand(Beta(γ,δ),N);
γData[:,1] .= γ
δData[:,1] .= δ
γ_init = Int(floor(γ))-1
δ_init = Int(floor(δ))-1
function decision(γ,δ,γ_init,δ_init)
γ = Int(floor(γ))
δ = Int(floor(δ))
return d[γ-γ_init,δ-δ_init]
end
dData[:,1] = broadcast(decision,γData[:,1],δData[:,1],γ_init,δ_init)
xData[:,1] = rand.(Bernoulli.(ξ)) .* dData[:,1];
for t=2:T
# beliefs only update when the agent invented at t-1 (xData is already 0 for non-inventors, but a failure must not be recorded for them)
γData[:,t] .= (γData[:,t-1].< γ+T) .* (γData[:,t-1] .+ dData[:,t-1] .* xData[:,t-1]) .+ (γData[:,t-1].>= γ+T) .* γData[:,t-1]
δData[:,t] .= (δData[:,t-1].< δ+T) .* (δData[:,t-1] .+ dData[:,t-1] .* (1 .- xData[:,t-1])) .+ (δData[:,t-1].>= δ+T) .* δData[:,t-1]
dData[:,t] .= broadcast(decision,γData[:,t],δData[:,t],γ_init,δ_init)
xData[:,t] .= rand.(Bernoulli.(ξ)) .* dData[:,t];
end
return γData, δData, dData, xData, ξ
end;
I set $\gamma=2.3, \delta=2.0, w=0.65, \beta=0.96, N=100000$ here for an illustration.
Random.seed!(42)
γ=2.3;δ=2.0;w=0.65;β=0.96;N=100_000;T=100;
@time v₀, v₁, V, d, fig = VFI(γ,δ,w,β,T);
γData, δData, dData, xData, ξ = simul_data_infty(N,T,γ,δ,d);
Step:  50, Euclidean: 1.0882e+00, Max: 4.3294e-02 
Step: 100, Euclidean: 1.1451e-01, Max: 5.3323e-03 
Step: 150, Euclidean: 1.1084e-02, Max: 6.3784e-04 
Step: 200, Euclidean: 1.0214e-03, Max: 7.3033e-05 
Step: 250, Euclidean: 8.8779e-05, Max: 7.8271e-06 
Step: 300, Euclidean: 7.1427e-06, Max: 7.5905e-07 
Step: 350, Euclidean: 5.2375e-07, Max: 6.4415e-08 
Step: 400, Euclidean: 3.4869e-08, Max: 4.7434e-09 
Step: 450, Euclidean: 2.1278e-09, Max: 3.0889e-10 
Step: 500, Euclidean: 1.2108e-10, Max: 1.8325e-11 
Step: 550, Euclidean: 6.5458e-12, Max: 1.0161e-12 
Step: 600, Euclidean: 3.4281e-13, Max: 6.0396e-14 
Step: 650, Euclidean: 2.8422e-14, Max: 1.4211e-14 
Step: 700, Euclidean: 3.5527e-15, Max: 3.5527e-15 
VFI complete. It took 706 iterations.
9.524045 seconds (14.81 M allocations: 1.038 GiB, 3.11% gc time, 96.84% compilation time)
Let's take a look at the policy function and the value function we found via VFI.
# Figures for the Policy/Value Functions
Plots.savefig(fig,"value_policy_dyn_infty")
fig
The figures below show the fraction of agents still inventing at $t$ (the survival rate) and the hazard rate at $t$.
# Figures for Survival/Hazard Rates
t = 1:T;
s = vec(sum(dData,dims=1)/N)[1:T];
h = vcat(0, reduce(vcat,(sum(dData[:,t-1])-sum(dData[:,t]))/sum(dData[:,t-1]) for t=2:T));
survival_fig = plot(t,s,lab="Survival rate")
title!(L"\textrm{Fraction of Agents Survived until } t")
xaxis!(L"t")
yaxis!(L"\textrm{Fraction}")
hazard_fig = plot(t,h,lab="Hazard rate")
title!(L"\textrm{Quitting at } t \textrm{ Conditional on Trying Until } t")
xaxis!(L"t")
yaxis!(L"\textrm{Fraction}")
survival_hazard = plot(survival_fig, hazard_fig, label=["" ""], size=(1200,500))
Plots.savefig(survival_hazard,"survival_hazard_rate")
survival_hazard
Notation: let $h_t(\gamma,\delta)$ denote the hazard rate at $t$, i.e., the probability of quitting at $t$ conditional on having invented in every period before $t$.
We are going to generate the data so that everyone tries inventing at $t=1$, so $h_1(\gamma,\delta)=0$.
Notice that at $t=3$, the proportion who tried until $t=2$ is $(1-h_1)(1-h_2)=1-h_2$. Also, the terms inside the sum represent, for every possible history up to $t=2$, the proportion of agents who survived until $t=2$ and quit at $t=3$. Directly enumerating all possible histories like this is feasible only because the states are discretized. Although the summation gets more complicated, let's follow this approach up to $t=5$:
Let's wrap this into a function and call it hazard:
@everywhere function hazard(d, γ, δ)
h₁ = 1-d[1,1]
h₂ = 1/(1-h₁) * (
d[1,1] * γ/(γ+δ) * (1-d[2,1]) +
d[1,1] * δ/(γ+δ) * (1-d[1,2])
)
h₃ = 1/(1-h₁) * 1/(1-h₂) * (
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * (1-d[3,1]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * (1-d[2,2]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * (1-d[2,2]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * (1-d[1,3])
)
h₄ = 1/(1-h₁) * 1/(1-h₂) * 1/(1-h₃) * (
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (γ+2)/(γ+δ+2) * (1-d[4,1]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (δ )/(γ+δ+2) * (1-d[3,2]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * (1-d[3,2]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * (1-d[3,2]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (γ )/(γ+δ+2) * (1-d[2,3]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * (1-d[2,3]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * (1-d[2,3]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (δ+2)/(γ+δ+2) * (1-d[1,4])
)
h₅ = 1/(1-h₁) * 1/(1-h₂) * 1/(1-h₃) * 1/(1-h₄)*(
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (γ+2)/(γ+δ+2) * d[4,1] * (γ+3)/(γ+δ+3) * (1-d[5,1]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (γ+2)/(γ+δ+2) * d[4,1] * (δ )/(γ+δ+3) * (1-d[4,2]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (δ )/(γ+δ+2) * d[3,2] * (γ+2)/(γ+δ+3) * (1-d[4,2]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * d[3,2] * (γ+2)/(γ+δ+3) * (1-d[4,2]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * d[3,2] * (γ+2)/(γ+δ+3) * (1-d[4,2]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (γ+1)/(γ+δ+1) * d[3,1] * (δ )/(γ+δ+2) * d[3,2] * (δ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * d[3,2] * (δ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * d[2,3] * (γ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (γ )/(γ+δ+2) * d[2,3] * (γ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * d[2,3] * (γ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (γ+1)/(γ+δ+2) * d[3,2] * (δ+1)/(γ+δ+3) * (1-d[3,3]) +
d[1,1] * γ/(γ+δ) * d[2,1] * (δ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * d[2,3] * (δ+2)/(γ+δ+3) * (1-d[2,4]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (γ )/(γ+δ+1) * d[2,2] * (δ+1)/(γ+δ+2) * d[2,3] * (δ+2)/(γ+δ+3) * (1-d[2,4]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (γ )/(γ+δ+2) * d[2,3] * (δ+2)/(γ+δ+3) * (1-d[2,4]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (δ+2)/(γ+δ+2) * d[1,4] * (γ )/(γ+δ+3) * (1-d[2,4]) +
d[1,1] * δ/(γ+δ) * d[1,2] * (δ+1)/(γ+δ+1) * d[1,3] * (δ+2)/(γ+δ+2) * d[1,4] * (δ+3)/(γ+δ+3) * (1-d[1,5])
)
return h₁, h₂, h₃, h₄, h₅
end;
Now we are ready to use these hazard rates and do MLE as in the two-period model. The sample comprises a cross section of spells $i\in\{1,\ldots,N\}$, some of which are completed at $\tau_i$ and some of which are incomplete, lasting at least $T$ periods. Let $p_{\tau}(\gamma;\delta)$ denote the unconditional probability that individual $i$ with parameters $(\gamma,\delta)$ invents for $\tau-1$ periods and stops inventing at $\tau$ if the spell is complete, and the unconditional probability that individual $i$ invents for at least $\tau$ periods if the spell is incomplete.
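Concretely, in terms of the hazard rates $h_t(\gamma,\delta)$ defined above, $p_{\tau}(\gamma;\delta)$ can be written as follows (this simply spells out what the likelihood code below implements): $$ \begin{align*} p_{\tau}(\gamma;\delta)=\begin{cases} \left[\prod_{s=1}^{\tau-1}\big(1-h_s(\gamma,\delta)\big)\right]h_{\tau}(\gamma,\delta) & \text{if the spell is completed at } \tau\\ \prod_{s=1}^{\tau}\big(1-h_s(\gamma,\delta)\big) & \text{if the spell is still ongoing after } \tau \text{ periods} \end{cases} \end{align*} $$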
The likelihood is then: $$\begin{align*} \mathcal{L}&=\prod_{i=1}^{N}p_{\tau_i}(\gamma;\delta)\\ \log\mathcal{L}&=\sum_{i=1}^{N}\log p_{\tau_i}(\gamma;\delta) \end{align*}$$
While we are playing with this model, we can think about this question: how much do our MLE estimates improve as i) N increases and ii) T increases in our data? If we have more information about what agents do in the future, can we estimate our parameter better? In order to see this, I will form the log-likelihood supposing that we have data up to $t=2,3,4,5$.
@everywhere function logLikelihood_infty(log_γ,δ,w,β,T,qData,time)
γ = exp(log_γ[1]) # the optimization is over log γ so that γ stays positive
_, _, _, d, _ = VFI(γ,δ,w,β,T,print_flag=0); # policy d implied by the candidate γ
h₁, h₂, h₃, h₄, h₅ = hazard(d, γ, δ)
if time ==2
return -sum(log.((qData.==0).*( h₁) .+
(qData.==1).*(1-h₁).*( h₂) .+
(qData.==2).*(1-h₁).*(1-h₂)))
elseif time ==3
return -sum(log.((qData.==0).*( h₁) .+
(qData.==1).*(1-h₁).*( h₂) .+
(qData.==2).*(1-h₁).*(1-h₂).*( h₃) .+
(qData.==3).*(1-h₁).*(1-h₂).*(1-h₃)))
elseif time ==4
return -sum(log.((qData.==0).*( h₁) .+
(qData.==1).*(1-h₁).*( h₂) .+
(qData.==2).*(1-h₁).*(1-h₂).*( h₃) .+
(qData.==3).*(1-h₁).*(1-h₂).*(1-h₃).*( h₄) .+
(qData.==4).*(1-h₁).*(1-h₂).*(1-h₃).*(1-h₄)))
else # time ==5
return -sum(log.((qData.==0).*( h₁) .+
(qData.==1).*(1-h₁).*( h₂) .+
(qData.==2).*(1-h₁).*(1-h₂).*( h₃) .+
(qData.==3).*(1-h₁).*(1-h₂).*(1-h₃).*( h₄) .+
(qData.==4).*(1-h₁).*(1-h₂).*(1-h₃).*(1-h₄).*( h₅) .+
(qData.==5).*(1-h₁).*(1-h₂).*(1-h₃).*(1-h₄).*(1-h₅)))
end
end;
@everywhere function simul_data_infty(N,T,γ,δ,d,Tdata)
# N: the number of agents
# T: the time horizon we wish to do VFI
# γ, δ: structural parameters
# d: decision rule
# Tdata: the last time period we wish to simulate data
γData = Array{Float64}(zeros(N,Tdata));
δData = Array{Float64}(zeros(N,Tdata));
dData = Array{Float64}(zeros(N,Tdata));
xData = Array{Float64}(zeros(N,Tdata));
ξ = rand(Beta(γ,δ),N);
γData[:,1] .= γ
δData[:,1] .= δ
γ_init = Int(floor(γ))-1
δ_init = Int(floor(δ))-1
function decision(γ,δ,γ_init,δ_init)
γ = Int(floor(γ))
δ = Int(floor(δ))
return d[γ-γ_init,δ-δ_init]
end
dData[:,1] = broadcast(decision,γData[:,1],δData[:,1],γ_init,δ_init)
xData[:,1] = rand.(Bernoulli.(ξ)) .* dData[:,1];
for t=2:Tdata
γData[:,t] = (dData[:,t-1].==1) .* ((γData[:,t-1].< γ+T) .* (γData[:,t-1] .+ 1 .* xData[:,t-1]) .+ (γData[:,t-1].>= γ+T) .* γData[:,t-1]) +
(dData[:,t-1].==0) .* γData[:,t-1]
δData[:,t] = (dData[:,t-1].==1) .* ((δData[:,t-1].< δ+T) .* (δData[:,t-1] .+ 1 .* (1 .- xData[:,t-1])) .+ (δData[:,t-1].>= δ+T) .* δData[:,t-1]) +
(dData[:,t-1].==0) .* δData[:,t-1]
dData[:,t] = broadcast(decision,γData[:,t],δData[:,t],γ_init,δ_init)
xData[:,t] = rand.(Bernoulli.(ξ)) .* dData[:,t];
end
return γData, δData, dData, xData, ξ
end;
N_vec = [500,5_000,50_000,500_000,5_000_000];Tdata=5;
_, _, dData, _, _ = simul_data_infty(N_vec[end],T,γ,δ,d,Tdata);
h_vec = hazard(d, γ, δ)
@everywhere begin
γ=2.3;δ=2.0;w=0.65;β=0.96;T=100;
v₀, v₁, V, d, _ = VFI(γ,δ,w,β,T,print_flag=0);
Random.seed!(42)
deviation = randn()
γ_init = [log(γ+deviation/2)]
lb, ub = log(0.1), log(γ+abs(deviation+2))
lb_ub = TwiceDifferentiableConstraints([lb],[ub]);
end
h_rate_infty = SharedArray{Float64}(zeros(length(N_vec),4));
result_infty = SharedArray{Float64}(zeros(length(N_vec),4,2));
@time @sync @distributed for i = 1:length(N_vec)
N = N_vec[i]
h_rate_infty[i,1] = sum((dData[1:N,1].==1).&(dData[1:N,2].==0))/sum((dData[1:N,1].==1))
h_rate_infty[i,2] = sum((dData[1:N,2].==1).&(dData[1:N,3].==0))/sum((dData[1:N,2].==1))
h_rate_infty[i,3] = sum((dData[1:N,3].==1).&(dData[1:N,4].==0))/sum((dData[1:N,3].==1))
h_rate_infty[i,4] = sum((dData[1:N,4].==1).&(dData[1:N,5].==0))/sum((dData[1:N,4].==1))
for t = 2:Tdata
qData = sum(dData[1:N,1:t],dims=2);
# The optimization is over log γ; γ_init, lb, and ub are all on the log scale.
func = TwiceDifferentiable(logγ -> logLikelihood_infty(logγ[1],δ,w,β,T,qData,t),γ_init);
opt = optimize(func, lb_ub, γ_init, IPNewton())
@printf("N=%7i using information up to t=%1i is done! \n",N,t)
γ_hat_optim = exp(opt.minimizer[1])
σ_hat_optim = sqrt(inv(hessian!(func,opt.minimizer)))[1] # asymptotic standard error from the inverse Hessian (with respect to log γ)
result_infty[i,t-1,1] = γ_hat_optim
result_infty[i,t-1,2] = σ_hat_optim
end
end
# Print MLE estimation results
print("------------ Estimating γ in an Infinite Horizon Model -------------\n")
print("Parameters: γ=$γ, δ=$δ, w=$w, β=$β \n")
@printf("Initial Point: %1.4f, Lower bound : %1.4f, Upper bound: %1.4f \n", exp(γ_init[1]), exp(lb), exp(ub))
@printf("Hazard Rate: Data vs Theory \n")
print("=====================================================================\n")
@printf("N ||"); [@printf(" %7i |", i) for i in N_vec]; @printf("| Theory |\n")
print("---------------------------------------------------------------------\n")
for t=1:4
print("h$(t+1) ||"); [@printf(" %1.5f |", i) for i in h_rate_infty[:,t]]; @printf("| %1.5f |\n",h_vec[t+1])
end
print("=====================================================================\n")
@printf("Estimation Result: \n")
print("==============================================================\n")
@printf("Data \\ N ||"); [@printf(" %7i |", i) for i in N_vec]; @printf("\n")
print("--------------------------------------------------------------\n")
for t = 1:4
print("Up to t=$(t+1) ||"); [@printf(" %1.5f |", i) for i in result_infty[:,t,1]]; @printf("\n")
print(" ||"); [@printf("(%1.5f)|", i) for i in result_infty[:,t,2]]; @printf("\n")
end
print("==============================================================\n")
@printf("Standard errors in parentheses.")
------------ Estimating γ in an Infinite Horizon Model -------------
Parameters: γ=2.3, δ=2.0, w=0.65, β=0.96 
Initial Point: 2.6942, Lower bound : 0.1000, Upper bound: 5.0884 
Hazard Rate: Data vs Theory 
=====================================================================
N  ||     500 |    5000 |   50000 |  500000 | 5000000 || Theory  |
---------------------------------------------------------------------
h2 || 0.45400 | 0.47060 | 0.46274 | 0.46459 | 0.46495 || 0.46512 |
h3 || 0.00000 | 0.00000 | 0.00000 | 0.00000 | 0.00000 || 0.00000 |
h4 || 0.16484 | 0.18209 | 0.17950 | 0.17929 | 0.17972 || 0.17969 |
h5 || 0.19737 | 0.20554 | 0.19577 | 0.19744 | 0.19835 || 0.19805 |
=====================================================================
Estimation Result: 
==============================================================
Data \ N  ||     500 |    5000 |   50000 |  500000 | 5000000 |
--------------------------------------------------------------
Up to t=2 || 2.40529 | 2.24989 | 2.32208 | 2.30491 | 2.30152 |
          ||(0.08982)|(0.02833)|(0.00897)|(0.00284)|(0.00090)|
Up to t=3 || 2.40529 | 2.24989 | 2.32208 | 2.30491 | 2.30152 |
          ||(0.08982)|(0.02833)|(0.00897)|(0.00284)|(0.00090)|
Up to t=4 || 2.43966 | 2.25264 | 2.31765 | 2.30529 | 2.30108 |
          ||(0.07865)|(0.02490)|(0.00786)|(0.00249)|(0.00079)|
Up to t=5 || 2.42519 | 2.24268 | 2.32054 | 2.30601 | 2.30036 |
          ||(0.07401)|(0.02356)|(0.00743)|(0.00235)|(0.00074)|
==============================================================
Standard errors in parentheses.
As $N$ increases, we see that our empirical hazard rates approach the theoretical values. The estimation results show that the estimates converge to the true $\gamma=2.3$ and the standard errors shrink as $N$ grows, while adding later periods of data improves precision only modestly.
It is also interesting to see that using information up to $t=3$ does not improve the estimates at all compared to using information up to $t=2$. This is because no one quits at $t=3$; thus, there is no additional information to use for our estimation there.
γ=2.3;δ=2.0;w=0.65;β=0.96;T=100;
N=5000;iter=50000;Tdata=5;
v₀, v₁, V, d, _ = VFI(γ,δ,w,β,T,print_flag=0);
h_vec_check = hazard(d, γ, δ)
h_rate_simul=SharedArray{Float64}(zeros(iter,4))
Random.seed!(42)
@time @sync @distributed for n = 1:iter
γData, δData, dData, xData, ξ = simul_data_infty(N,T,γ,δ,d,Tdata);
for t = 1:4
h_rate_simul[n,t] = sum((dData[:,t].==1).&(dData[:,t+1].==0))/sum((dData[:,t].==1))
end
end;
83.480044 seconds (77.91 k allocations: 4.122 MiB, 0.06% compilation time)
# Checking whether the simulation is sensible
print("--- Validating the Simulation of $N Observations with $iter Iterations ---\n")
for t in 1:4
print("h$(t+1) ");@printf("%3.6f, h2_data: %3.6f \n",h_vec_check[t+1],mean(h_rate_simul[:,t]))
end
--- Validating the Simulation of 5000 Observations with 50000 Iterations ---
h2 theory: 0.465116, data: 0.465092 
h3 theory: 0.000000, data: 0.000000 
h4 theory: 0.179695, data: 0.179677 
h5 theory: 0.198052, data: 0.198025 