Structural Econometrics - Assignment 1 Tutorial

Author: Jaepil Lee

October 21, 2021

Preliminary: Beta Distribution and Conjugate Prior

Static Problem

Dynamic Problem: 2 Periods

Dynamic Problem: Infinite Horizon

The model in this assignment is summarized as follows: in each period, an agent decides whether to attempt an invention ($d_t=1$) or take an outside option that pays $w$ ($d_t=0$). An attempt succeeds ($x_t=1$) with probability equal to her ability $\xi$ and pays 1; it fails ($x_t=0$) with probability $1-\xi$ and pays 0. The agent does not know $\xi$; she holds a belief $\xi\sim\text{Beta}(\gamma,\delta)$ and updates it after observing the outcome of each attempt.

Preliminary: Beta Distribution and Conjugate Prior

Suppose $\xi\sim\text{Beta}(\gamma, \delta)$ with $\gamma,\delta>0$. Then $\xi$ has support $(0,1)$ and mean $\mathbb{E}[\xi]=\frac{\gamma}{\gamma+\delta}$, a property we will use repeatedly below.

If the agent invents, she will get the result of inventing, either success or failure. Based on the result, she will update her belief about her ability by updating her parameters $(\gamma, \delta)$ via Bayes' rule.

Statisticians have found many cases where the prior and posterior distributions belong to the same distribution family after a Bayesian update. The prior distribution in such a case is called a conjugate prior for the likelihood function. In Miller (1984), the conjugate prior is a normal distribution and the likelihood is also normal. In this assignment, the conjugate prior is a beta distribution and the likelihood is a Bernoulli distribution.

The prior distribution of $\xi$ given parameters $(\gamma, \delta)$ is $$ g(\xi;\gamma,\delta)=\frac{\xi^{\gamma-1} (1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)} \text{ where } \text{B}(\gamma,\delta)=\int_{0}^{1} u^{\gamma-1}(1-u)^{\delta-1}du $$ and the likelihood of the outcome $x\in\{0,1\}$ given $\xi$ is $$ f(x\,|\,\xi)= \xi^{x} (1-\xi)^{1-x}. $$ The agent's posterior belief is derived by using Bayes' rule: $$ \begin{split} f(\xi|x)& =\frac{f(x|\xi)}{f(x)}g(\xi)=\frac{f(x|\xi)}{\int_{0}^{1}f(x|\xi)g(\xi)d\xi}g(\xi)= \frac{\xi^{x}(1-\xi)^{1-x}}{\int_{0}^{1}\xi^{x}(1-\xi)^{1-x}\frac{{\xi}^{\gamma-1}(1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)}d\xi}\frac{\xi^{\gamma-1}(1-\xi)^{\delta-1}}{\text{B}(\gamma,\delta)}\\ & = \frac{\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}}{\int_{0}^{1}\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}d\xi}= \frac{\xi^{\gamma+x-1}(1-\xi)^{\delta+(1-x)-1}}{\text{B}(\gamma+x,\delta+(1-x))} \end{split} $$ Therefore, the agent's updated belief about her ability follows a beta distribution with parameters $(\gamma+x,\delta+(1-x))$.

The updated expected payoff is then: $$ \mathbb{E}[\mathbf{1}\{x'=1\}|\gamma',\delta'] = \frac{\gamma'}{\gamma' + \delta'} = \begin{cases} \frac{\gamma}{\gamma + (\delta+1)} & \text{ if } x=0\\ \frac{\gamma+1}{(\gamma+1) + \delta} & \text{ if } x=1 \end{cases} $$ If the agent chooses not to invent, then there will be no update on her parameters (there is no information to update the parameters). Thus, the agent's belief about her ability in the next period will still be $\xi \sim \text{Beta}(\gamma, \delta)$. i.e., the agent solves the recursive problem in the next period with the same parameters.
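Here is a minimal sketch of this conjugate update in Julia (it assumes the Distributions.jl package; the helper name `update_belief` is mine, not part of the assignment):

```julia
using Distributions

# Posterior update of a Beta(γ, δ) belief after a Bernoulli outcome x ∈ {0, 1}:
# a success increments γ, a failure increments δ.
update_belief(γ, δ, x) = (γ + x, δ + (1 - x))

γ, δ = 2.0, 3.0
println(mean(Beta(γ, δ)))            # prior mean γ/(γ+δ) = 0.4

γ1, δ1 = update_belief(γ, δ, 1)      # one success observed
println(mean(Beta(γ1, δ1)))          # posterior mean (γ+1)/(γ+1+δ) = 0.5
```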

Static Problem

Let's start with a simple setting and suppose that we are solving a static model. In this case, the lifetime utility is $$d_t\mathbf{1} \{x_t=1\} + (1-d_t)w.$$

If we knew the exact value of $\xi$, then the decision rule is simple: we choose to invent if the expected payoff of invention is larger than the payoff of the outside option given $\xi$: $$ \mathbb{E}_{x}\big[1\cdot\mathbf{1}\{x=1\}+0\cdot\mathbf{1}\{x=0\}|\xi]=1\cdot\mathbb{P}(x=1|\xi) + 0\cdot\mathbb{P}(x=0|\xi) = \xi. $$ In this case, the decision rule would be: $$d_t=\begin{cases} 1 &\text{ if } \xi>w \\ 0 &\text{ otherwise } \end{cases}$$

However, the agent only knows that her ability $\xi$ is a random draw from a beta distribution $\text{Beta}(\gamma,\delta)$, not its exact value. As a risk-neutral agent, the agent would compute her expected return on inventing and decide whether it is worth trying or not. $$ \mathbb{E}_{\xi} \Big[\mathbb{E}_{x} \big[ \mathbf{1}\{x=1\} \big| \xi \big] \Big|\gamma,\delta\Big] =\mathbb{E}_{\xi} \big[1 \cdot \mathbb{P}(x=1|\xi) + 0 \cdot \mathbb{P}(x=0|\xi) \big| \gamma,\delta \big] =\mathbb{E}_{\xi} [1 \cdot \xi + 0 \cdot (1-\xi) | \gamma,\delta] = \mathbb{E}_{\xi}[{\xi}|\gamma,\delta]=\frac{\gamma}{\gamma+\delta}. $$ The decision rule is then: $$ d_t=\begin{cases} 1 &\text{ if } \frac{\gamma}{\gamma+\delta}>w \\ 0 &\text{ otherwise } \end{cases} $$

Let's make simulated data of $N$ agents with this decision rule!
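Below is a sketch of that simulation (the function name `simulate_static` and the parameter values are my own choices for illustration):

```julia
using Distributions, Random, Statistics

# In the static model every agent faces the same (γ, δ, w), so they all make the
# same choice: invent iff γ/(γ+δ) > w.
function simulate_static(N, γ, δ, w; rng = MersenneTwister(1234))
    d = fill(γ / (γ + δ) > w, N)                           # identical decisions
    ξ = rand(rng, Beta(γ, δ), N)                           # each agent's true ability
    x = [d[i] ? rand(rng) < ξ[i] : missing for i in 1:N]   # outcome only if she invents
    return d, x
end

d, x = simulate_static(1_000, 2.0, 3.0, 0.3)
println(mean(d))   # 1.0 here, since γ/(γ+δ) = 0.4 > w = 0.3
```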

By now, you might have noticed that in the static case, everyone makes the same choice! This is because in the first period, everyone has the same belief about their ability. As agents try out inventing and learn more about their ability, we will see people making different choices.

Given data where everyone makes the same choice (i.e., all zeros or all ones), we cannot point-identify any of the parameters $(\gamma,\delta,w)$. Let's take a step back and look at the decision rule: $$ d_t=\begin{cases} 1 &\text{ if } \frac{\gamma}{\gamma+\delta}>w \\ 0 &\text{ otherwise } \end{cases} $$

Dynamic Problem: 2 Periods

Let's solve the two-period model. The lifetime utility is now $\sum_{t=1}^{2} \beta^{t-1} [d_t\mathbf{1} \{x_t=1\} + (1-d_t)w]$. The state variables in each period are $(\gamma_t,\delta_t,w,t,\beta)$.

Let's solve this model by backward induction. At $t=2$, the agent observes $(\gamma_{2},\delta_{2},w,2,\beta)$ and solves $ \underset{d_{2}\in\{0,1\}}{\max}\;\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[d_2\mathbf{1} \{x_2=1\} + (1-d_2)w\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big]. $ It is straightforward that at $t=2$, the agent will choose to invent whenever the expected payoff of inventing is higher than choosing the outside option. We also derived that $\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[\mathbf{1}\{x_{2}=1\}\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big] = \frac{\gamma_2}{\gamma_2 + \delta_2}$. Thus, the decision rule at $t=2$ becomes: $\begin{align*} d_{2}(\gamma_2,\delta_2,w)=\begin{cases} 1 & \text{if } \frac{\gamma_2}{\gamma_2 + \delta_2}> w\\ 0 & \text{if } \frac{\gamma_2}{\gamma_2 + \delta_2}\leq w \end{cases} = \mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}. \end{align*}$

Plugging the decision rule into the maximization problem, the expected value function at $t=2$ becomes: $$\begin{align*} V(\gamma_2,\delta_2,w,2,\beta) &= \underset{d_{2}\in\{0,1\}}{\max}\;\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[d_2\mathbf{1} \{x_2=1\} + (1-d_2)w\big|\xi_2\big]\Big|\gamma_2,\delta_2\Big] \\ &= d_2(\gamma_2,\delta_2,w)\mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[\mathbf{1}\{x_{2}=1\}\big|\xi_2 \big]\Big|\gamma_2,\delta_2\Big] + (1-d_2(\gamma_2,\delta_2,w))w \\ &= d_2(\gamma_2,\delta_2,w)\frac{\gamma_2}{\gamma_2+\delta_2} + (1-d_2(\gamma_2,\delta_2,w))w \\ &= \mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\} \frac{\gamma_2}{\gamma_2+\delta_2} + \left(1-\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\right) w \end{align*}$$

Knowing the decision rule $d_{2}(\gamma_2,\delta_2,w)$, we can solve for the agent's choice at $t=1$. At $t=1$, the agent maximizes her expectation of the discounted present value of the lifetime payoff: $$ \begin{align*} V(\gamma_1,\delta_1,w,1,\beta) = \underset{d_{1}\in\{0,1\}}{\max}\; \mathbb{E}_{\xi_1}\Big[&\mathbb{E}_{x_1}\big[d_1\mathbf{1}\{x_{1}=1\}+(1-d_{1})w\big|\xi_1\big]\Big|\gamma_1,\delta_1\Big] \\ +\beta \Bigg(&d_1\mathbb{E}_{\xi_1}\Big[\mathbb{E}_{x_1}\Big[\mathbf{1}\{x_1=0\}V(\gamma_2,\delta_2,w,2)\Big|\xi_1\Big]\Big|\gamma_1,\delta_1\Big]+\\ &d_1\mathbb{E}_{\xi_1}\Big[\mathbb{E}_{x_1}\Big[\mathbf{1}\{x_1=1\}V(\gamma_2,\delta_2,w,2)\Big|\xi_1\Big]\Big|\gamma_1,\delta_1\Big]+\\ &(1-d_1)V(\gamma_2,\delta_2,w,2)\Bigg) \end{align*} $$ where $(\gamma_2,\delta_2)$ are updated by the following rule: $$ \begin{align*} (\gamma_2,\delta_2) = \begin{cases} (\gamma_1+1, \delta_1) &\text{if } d_1=1, x_1 =1\\ (\gamma_1, \delta_1+1) &\text{if } d_1=1, x_1 =0 \\ (\gamma_1, \delta_1) &\text{if } d_1=0 \end{cases}. \end{align*} $$

Noting that $\mathbb{E}_{\xi_1}[\mathbb{P}[x_1=1|\xi_1]\big|\gamma,\delta]=\frac{\gamma}{\gamma+\delta}$ and $\mathbb{E}_{\xi_1}[\mathbb{P}[x_1=0|\xi_1]\big|\gamma,\delta]=\frac{\delta}{\gamma+\delta}$, we rewrite the value function as: $$ \begin{equation*} \begin{split} V(\gamma,\delta,w,1,\beta) = \underset{d_{1}}{\max}\; d_{1}\frac{\gamma}{\gamma+\delta}+(1-d_{1})w +\beta \left[d_1\frac{\gamma}{\gamma+\delta}V(\gamma+1,\delta,w,2)+d_1\frac{\delta}{\gamma+\delta}V(\gamma,\delta+1,w,2)+(1-d_1)V(\gamma,\delta,w,2)\right] \end{split} \end{equation*} $$

Finally, we use $V(\gamma_2,\delta_2,w,2,\beta)=\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\cdot \frac{\gamma_2}{\gamma_2+\delta_2} + \left(1-\mathbf{1}\left\{\frac{\gamma_2}{\gamma_2 + \delta_2}> w\right\}\right)\cdot w$ to find the expression for $V(\gamma,\delta,w,1,\beta)$ with only $\gamma,\delta,w$, and $d_1$: $$ \begin{align*} V(\gamma,\delta,w,1,\beta) = \max_{d_{1}} \; d_{1}\frac{\gamma}{\gamma+\delta}+(1-d_{1})w + \beta\bigg[&d_1\frac{\gamma}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\} \frac{\gamma+1}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\} w\right)+\\ &d_1\frac{\delta}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}>w\right\} \frac{\gamma}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\} w\right)+\\ &(1-d_1)\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\} \frac{\gamma}{\gamma+\delta} + \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}\leq w\right\} w\right)\bigg] \end{align*} $$

Side note: we could write it this way only because we had two periods. If you have more than two periods, you may want to prepare a mapping from the state space to the decision for each period. In this case, storing a policy function $d_t=d(\gamma,\delta,w,t)\in\{0,1\}$ on a discretized state space for each time period $t$ may be necessary. If you have an infinite horizon, the time dimension goes away and you only need to find $d = d(\gamma,\delta,w)$, which we shall see later.

Can you find $w^*$, the upper bound of $w$, that ensures for every $w<w^*$, everyone invents in the first period? From the optimization problem in the first period, $d_1=1$ if the value of the value function when choosing $d_1=1$ is larger than or equal to that when choosing $d_1=0$: $$ \begin{aligned} \frac{\gamma}{\gamma+\delta}+\beta\bigg[ &\frac{\gamma}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\} \frac{\gamma+1}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\} w\right)+ \\ &\frac{\delta}{\gamma+\delta}\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\} \frac{\gamma}{\gamma+\delta+1} + \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\} w\right)\bigg] \\ &\geq w+\beta\left(\mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\} \frac{\gamma}{\gamma+\delta} + \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}\leq w\right\} w\right) \end{aligned} $$

$w$ is compared to three quantities $\frac{\gamma}{\gamma+\delta}$,$\frac{\gamma+1}{\gamma+\delta+1}$, $\frac{\gamma}{\gamma+\delta+1}$ inside the indicator functions. It is clear that $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$. Thus, we have four cases to consider:

  1. $w<\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$
  2. $\frac{\gamma}{\gamma+\delta+1}\leq w<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$
  3. $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}\leq w<\frac{\gamma+1}{\gamma+\delta+1}$
  4. $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}\leq w$
  1. $w<\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$ The following shows the values for indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=0 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}+\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\bigg] &\geq w+\beta\bigg[\frac{\gamma}{\gamma+\delta}\bigg]\\ \frac{\gamma}{\gamma+\delta}&\geq w \end{align*} $$ Thus, if $w<\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}$, everyone will choose to invent.

  2. $\frac{\gamma}{\gamma+\delta+1}\leq w<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$ The following shows the values for the indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=0 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}+\frac{\delta}{\gamma+\delta}w\bigg]&\geq w+\beta\bigg[\frac{\gamma}{\gamma+\delta}\bigg]\\ \frac{\gamma}{\gamma+\delta}\frac{1-\frac{\beta\delta}{\gamma+\delta+1}}{1-\frac{\beta\delta}{\gamma+\delta}}&\geq w \end{align*} $$ Thus, everyone will choose to invent if $\frac{\gamma}{\gamma+\delta+1}\leq w<\min\{\frac{\gamma}{\gamma+\delta},\frac{\gamma}{\gamma+\delta}\frac{1-\frac{\beta\delta}{\gamma+\delta+1}}{1-\frac{\beta\delta}{\gamma+\delta}}\}=\frac{\gamma}{\gamma+\delta}$.

  3. $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}\leq w<\frac{\gamma+1}{\gamma+\delta+1}$ The following shows the values for the indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=1 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=0,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=1 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[ \frac{\gamma}{\gamma+\delta} \frac{\gamma+1}{\gamma+\delta+1} +\frac{\delta}{\gamma+\delta} w \bigg] &\geq w+\beta w \\ \frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}&\geq w \end{align*} $$ Thus, everyone will choose to invent if $\frac{\gamma}{\gamma+\delta}\leq w<\min\{\frac{\gamma+1}{\gamma+\delta+1},\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}\}=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$.

  4. $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}\leq w$ The following shows the values for the indicator functions: $$ \begin{align*} \mathbf{1}\left\{\frac{\gamma+1}{\gamma+\delta+1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma+1}{\gamma + \delta +1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta +1}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma+\delta+1}\leq w\right\}=1,\\ \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta}> w\right\}=0 &\text{ and } \mathbf{1}\left\{\frac{\gamma}{\gamma + \delta} \leq w \right\}=1 \end{align*} $$ Plugging these values into the inequality above, $d_1=1$ if: $$ \begin{align*} \frac{\gamma}{\gamma+\delta}+\beta\bigg[\frac{\gamma}{\gamma+\delta}w + \frac{\delta}{\gamma+\delta} w \bigg] &\geq w+\beta w \\ \frac{\gamma}{\gamma+\delta} &\geq w \end{align*} $$ We have a contradiction: the case assumes $\frac{\gamma+1}{\gamma+\delta+1}\leq w$, while $d_1=1$ requires $\frac{\gamma}{\gamma+\delta} \geq w$, which is impossible because $\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}$. Thus, there is no $w$ that can make everyone choose $d_1=1$ if $\frac{\gamma}{\gamma+\delta+1}<\frac{\gamma}{\gamma+\delta}<\frac{\gamma+1}{\gamma+\delta+1}\leq w$.

To sum up, everyone will choose to invent at $t=1$ if $w<\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}=w^*$.

Let's code what we discussed so far. Instead of writing a bunch of indicator functions, I want to be lazy here and tell the program to find the decision rule to the maximization problem on its own via backward induction. This is convenient because it allows us to easily extend the program to a finite-horizon model of any length $T$.

We start from the last period, $t=2$. In this period, we do not have any continuation value to think about; the maximization problem only has today's per-period utility. The value function and the policy function here are straightforward: $$ \begin{aligned} V(\gamma,\delta,w,2,\beta) &= \underset{d\in\{0,1\}}{\max} \quad\; d \frac{\gamma}{\gamma+\delta}+ (1-d) w\\ d(\gamma,\delta,w,2,\beta) &= \underset{d\in\{0,1\}}{\arg\max} \; d \frac{\gamma}{\gamma+\delta}+ (1-d) w\\ \end{aligned} $$ The policy function and the value function at $t=1$ simply take the value function and the policy function we found at $t=2$ and return the solution and the maximized value to the maximization problem: $$ \begin{aligned} V(\gamma,\delta,w,1,\beta) = \underset{d\in\{0,1\}}{\max} &d \frac{\gamma}{\gamma+\delta}+ (1-d) w + \beta \Bigg(d\left(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \right) + (1-d) V(\gamma,\delta,w,2,\beta)\Bigg) \\ d(\gamma,\delta,w,1,\beta) = \underset{d\in\{0,1\}}{\arg\max} &d \frac{\gamma}{\gamma+\delta}+ (1-d) w + \beta \Bigg(d\left(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \right) + (1-d) V(\gamma,\delta,w,2,\beta)\Bigg) \\ \end{aligned} $$
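Here is a minimal sketch of this backward induction in Julia (the helper names `p_success`, `V2`, `d2`, `v1`, and so on are mine, not part of the assignment):

```julia
# Expected per-period payoff of inventing given beliefs (γ, δ).
p_success(γ, δ) = γ / (γ + δ)

# Terminal period t = 2: compare inventing with the outside option.
V2(γ, δ, w) = max(p_success(γ, δ), w)
d2(γ, δ, w) = p_success(γ, δ) > w

# Choice-specific value at t = 1: flow payoff plus the discounted continuation value,
# where the continuation beliefs depend on today's choice and outcome.
function v1(d, γ, δ, w, β)
    p = p_success(γ, δ)
    flow = d ? p : w
    cont = d ? p * V2(γ + 1, δ, w) + (1 - p) * V2(γ, δ + 1, w) : V2(γ, δ, w)
    return flow + β * cont
end

V1(γ, δ, w, β) = max(v1(true, γ, δ, w, β), v1(false, γ, δ, w, β))
d1(γ, δ, w, β) = v1(true, γ, δ, w, β) > v1(false, γ, δ, w, β)
```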

Side note: you can "solve and take note of" the solution to the model by telling the program to return the decision at $t$ given state variables $(\gamma,\delta,w,\beta)$ and store them in DataFrames or in an Array (memoization) while doing backward induction. I will not do that here because the computation is cheap in our case. You may want to do this when the state space or time horizon becomes large.

Generating data based on this decision is also simple.
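A sketch of that data generation, reusing `d1` and `d2` from above (the name `simulate_two_periods` and the parameter values are my own):

```julia
using Distributions, Random

function simulate_two_periods(N, γ, δ, w, β; rng = MersenneTwister(1))
    D1 = falses(N); X1 = falses(N); D2 = falses(N)
    for i in 1:N
        ξ = rand(rng, Beta(γ, δ))                 # true (unobserved) ability
        D1[i] = d1(γ, δ, w, β)                    # same first-period choice for everyone
        X1[i] = D1[i] && rand(rng) < ξ            # outcome only realized if she invents
        γ2, δ2 = D1[i] ? (γ + X1[i], δ + 1 - X1[i]) : (γ, δ)
        D2[i] = d2(γ2, δ2, w)                     # second-period choice under updated beliefs
    end
    return D1, X1, D2
end

# w = 0.38 lies in (γ/(γ+δ+1), γ/(γ+δ)), so everyone invents at t = 1
# and agents who fail quit at t = 2.
D1, X1, D2 = simulate_two_periods(10_000, 2.0, 3.0, 0.38, 0.95)
```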

We can use $w^*=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$ and the choice-specific conditional value functions to check whether our program is well written. A choice-specific conditional value function is the discounted present value of lifetime utility if an agent commits to a certain choice today and behaves optimally in the periods that follow. In our case, there are two choice-specific conditional value functions at $t=1$: $$ \begin{align*} v_0(\gamma,\delta,w,1,\beta) &= w + \beta V(\gamma,\delta,w,2,\beta) \\ v_1(\gamma,\delta,w,1,\beta) &= \frac{\gamma}{\gamma+\delta}+ \beta \Bigg(\frac{\gamma}{\gamma+\delta} V(\gamma+1,\delta,w,2,\beta)+ \frac{\delta}{\gamma+\delta} V(\gamma,\delta+1,w,2,\beta) \Bigg) \end{align*} $$ We can plug $w^*=\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$ into our choice-specific conditional value functions and check that they take the same value, which is precisely what we expect from the definition of $w^*$.
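Numerically, using the hypothetical `v1` helper from the sketch above (`v1(true, ...)` and `v1(false, ...)` play the roles of $v_1$ and $v_0$):

```julia
# At w = w*, inventing and the outside option should give the same value at t = 1.
wstar(γ, δ, β) = (γ / (γ + δ)) * (1 + β * (γ + 1) / (γ + δ + 1)) / (1 + β * γ / (γ + δ))

γ, δ, β = 2.0, 3.0, 0.95
w = wstar(γ, δ, β)
println(v1(true, γ, δ, w, β) ≈ v1(false, γ, δ, w, β))   # expected: true
```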

Let's suppose we only observe the agents' choices at $t = 2$. From the data, we can only talk about the fraction of agents who quit inventing at $t=2$ conditional on having tried inventing at $t=1$. Theoretically, we can think of the following cases: $$ \begin{align*} \mathbb{P}(d_2=0|d_1=1)=\begin{cases} 0 &\text{ if } w<w^* \text{ and } w<\frac{\gamma}{\gamma+\delta+1} \\ \alpha &\text{ if } w<w^* \text{ and } \frac{\gamma}{\gamma+\delta+1}<w \text{ where } \alpha\in(0,1) \\ 1 &\text{ if } w<w^* \text{ and } w>\frac{\gamma+1}{\gamma+\delta+1} \end{cases} \end{align*} $$

We can easily show that the third case is impossible. Thus, we consider two cases:

  1. $\mathbb{P}(d_2=0|d_1=1)=0$; i.e., we only observe ones in the data.
    • This can happen if $w<\frac{\gamma}{\gamma+\delta+1}$ (which already implies $w<w^*$). With this condition we can only place bounds on one of the parameters, given specific values of the others.
    • For example, if we know the exact values of $\gamma$ and $\delta$, we can only say that $w$ is less than $\frac{\gamma}{\gamma+\delta+1}$. Even then, any value of $\beta\in(0,1)$ can generate the same data, so we cannot identify $\beta$.
  2. $\mathbb{P}(d_2=0|d_1=1)=\alpha$; i.e., we observe some zeros and some ones in the data.
    • This can happen if $w<w^*$ and $\frac{\gamma}{\gamma+\delta+1}<w$.
    • If we are given the exact values of all but one of $(\gamma,\delta,w,\beta)$, then how can we identify the remaining parameter?
      • If we are asked to identify either $\gamma$ or $\delta$, then we can use our knowledge that $\mathbb{E}[\mathbf{1}\{d_{2i}=1\}]=\frac{\gamma}{\gamma+\delta}$ (details below).
      • If we are asked to identify $w$ or $\beta$, we can only identify up to some bounds:
        • For $w$, we can only say that $\frac{\gamma}{\gamma+\delta+1}<w<\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$.
        • For $\beta$, we can only say that $w<\frac{\gamma}{\gamma+\delta}\frac{1+\beta\frac{\gamma+1}{\gamma+\delta+1}}{1+\beta\frac{\gamma}{\gamma+\delta}}$, i.e., $\frac{(\gamma+\delta+1)(w(\gamma+\delta)-\gamma)}{\gamma(\gamma+1-w(\gamma+\delta+1))}<\beta$.

Identifying $\gamma$ or $\delta$ is more interesting, so let's focus on identifying and estimating $\gamma$ via MLE. Let's suppose we are given $(\delta,w,\beta,\{d_{2i}\}_{i=1}^N)$ and are asked to identify and estimate $\gamma$. From the model, we know: $$ d_{2i}=\mathbf{1} \bigg\{ \mathbb{E}_{\xi_2}\bigg[\mathbb{E}_{x_2}\big[ \mathbf{1}\{x_2=1\}\big|\xi_2\big]\Big|\gamma,\delta,x_1 \bigg] > w \bigg\} $$ i.e., $d_2$ is chosen by comparing the expected payoff of inventing which depends on our updated belief to the payoff of the outside option. The probability of observing $d_{2i}=1$, $\mathbb{E}[\mathbf{1}[d_{2i}=1]]$, is then: $$ \begin{align*} \mathbb{E} \left[\mathbf{1}[d_{2i}=1]\right] =& \mathbb{E} \Bigg[\mathbf{1} \bigg\{ \mathbb{E}_{\xi_2}\Big[\mathbb{E}_{x_2}\big[ \mathbf{1}\{x_2=1\}\big|\xi_2\big]\Big|\gamma,\delta,x_1 \Big] > w \bigg\}\Bigg] = \mathbb{E} \bigg[ \mathbf{1} \Big\{ \mathbb{E}_{\xi_2}\big[ 1\cdot\xi_{2}+0\cdot(1-\xi_{2})\big|\gamma,\delta,x_1 \big] > w \Big\} \bigg] = \mathbb{P} \Big[ \mathbb{E}_{\xi_2} \big[\xi_{2};\gamma,\delta\big] > w \Big]\\ =& \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=1, x_1=1 \Big] \cdot \mathbb{P} \Big[ d_{1}=1, x_1=1 \Big] + \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=1, x_1=0 \Big] \cdot \mathbb{P} \Big[ d_{1}=1, x_1=0 \Big] \\ +& \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] > w \big| d_{1}=0 \Big] \cdot \mathbb{P} \Big[ d_{1}=0 \Big] \end{align*} $$

We saw that $w<w^{*} \implies d_1=1$. Since we are considering a dataset where all agents are guaranteed to invent in the first period, we have $\mathbb{P}[d_1=0]=0.$ Thus, the following holds: $$ \begin{align*} \mathbb{E} \left[\mathbf{1}[d_{2i}=1]\right] = &\mathbb{P} \Big[ \mathbb{E}_{\xi_2} \big[ \xi_{2}; \gamma,\delta,x_1 \big] \geq w \bigm| d_{1}=1, x_1=1 \Big] \cdot \mathbb{P} \Big[d_{1}=1, x_1=1 \Big]+ \mathbb{P} \Big[ \mathbb{E}_{\xi_2}\big[\xi_{2};\gamma,\delta,x_1\big] \geq w \bigm| d_{1}=1, x_1=0 \Big] \cdot \mathbb{P} \Big[d_{1}=1, x_1=0 \Big]\\ = &\mathbb{P} \bigg[ \frac{\gamma+1}{\gamma+\delta+1} \geq w \bigg] \cdot \frac{\gamma}{\gamma+\delta} + \mathbb{P} \bigg[ \frac{\gamma}{\gamma+\delta+1} \geq w \bigg] \cdot \frac{\delta}{\gamma+\delta} = \frac{\gamma}{\gamma+\delta} \quad \because w<w^*<\frac{\gamma+1}{\gamma+\delta+1} \text{ and } \frac{\gamma}{\gamma+\delta+1}<w. \end{align*} $$

In words, we know that the agent would choose to invent in the second period if invention was successful in the first period. We also know that the probability of success follows a beta distribution $\text{Beta}(\gamma,\delta)$ with expected value $\frac{\gamma}{\gamma+\delta}$. Thus, the likelihood of observing an agent inventing in the second period given $(\gamma,\delta)$ is $\frac{\gamma}{\gamma+\delta}$.

The flipside of this argument is the hazard rate at $t=2$. The probability of an agent choosing to quit in the second period is $\frac{\delta}{\gamma+\delta}$. I suggest you use the reasoning I provided above to convince yourself that the hazard rate is indeed $\frac{\delta}{\gamma+\delta}$.

The discussion above motivates constructing the likelihood of $\{d_{i2}\}_{i=1}^{N}$ as: $$ \begin{align*} \mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)=\prod_{i=1}^{N}\left(\frac{\gamma}{\gamma+\delta}\right)^{d_{i2}}\left(\frac{\delta}{\gamma+\delta}\right)^{1-d_{i2}} \end{align*} $$ The log-likelihood is $$ \begin{align*} \log\mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)&=\sum_{i=1}^{N}\left(d_{i2}\log\left(\frac{\gamma}{\gamma+\delta}\right)+(1-d_{i2})\log\left(\frac{\delta}{\gamma+\delta}\right)\right)\\ &=\sum_{i=1}^{N}\left(d_{i2}\left(\log\gamma-\log(\gamma+\delta)\right)+(1-d_{i2})\left(\log\delta-\log(\gamma+\delta)\right)\right) \end{align*} $$

Let's exploit that $\{d_{i2}\}_{i=1}^{N}$ are independent. The score function of a single observation $d_{i2}$ is $$ \begin{align*} s(\gamma;d_{i2},\delta)=\frac{\partial}{\partial\gamma}\log f(\gamma;d_{i2},\delta)=d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right) \end{align*} $$ This gives us the derivative of the log-likelihood with respect to $\gamma$: $$ \begin{align*} \frac{\partial}{\partial\gamma}\log \mathcal{L}(\gamma;\{d_{i2}\}_{i=1}^{N},\delta)=\sum_{i=1}^{N}\left(d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right)\right) \end{align*} $$

Setting the above to zero and solving for $\gamma$ gives us the MLE of $\gamma$: $$ \begin{align*} \sum_{i=1}^{N}\left(d_{i2}\left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)+(1-d_{i2})\left(-\frac{1}{\gamma+\delta}\right)\right) &= 0 \\ \left(\frac{1}{\gamma}-\frac{1}{\gamma+\delta}\right)\sum_{i=1}^{N}d_{i2} -\frac{N}{\gamma+\delta} + \frac{1}{\gamma+\delta}\sum_{i=1}^{N}d_{i2}&= 0 \\ \frac{1}{\gamma}\sum_{i=1}^{N}d_{i2} = \frac{N}{\gamma+\delta}&\\ \therefore \hat{\gamma} = \frac{\delta\sum_{i=1}^{N}d_{i2}}{N-\sum_{i=1}^{N}d_{i2}}& \end{align*} $$

$\{d_{i2}\}_{i=1}^{N}$ are i.i.d. so I use the following theorem to compute the Fisher information: $$ \begin{align*} I_{N}(\gamma)&=N\cdot I(\gamma)=-N\cdot \mathbb{E}_{\gamma}\left(\frac{\partial^2\log f(\gamma;d_{i2},\delta)}{\partial \gamma^2}\right)\\ &=-N\cdot\mathbb{E}_{\gamma}\left( d_{i2}\left(-\frac{1}{\gamma^2}+\frac{1}{(\gamma+\delta)^2}\right)+(1-d_{i2})\left(\frac{1}{(\gamma+\delta)^2}\right)\right)\\ &=-N\cdot\left(\left(-\frac{1}{\gamma^2}+\frac{1}{(\gamma+\delta)^2}\right)\frac{\gamma}{\gamma+\delta}+\left(\frac{1}{(\gamma+\delta)^2}\right)\frac{\delta}{\gamma+\delta}\right) \\ &=\frac{N\delta}{\gamma(\gamma+\delta)^2} \end{align*} $$ Substituting $\gamma$ with $\hat{\gamma}$, we have asymptotic normality of the MLE as follows: $$ \begin{align*} &\hat{se} = \sqrt{1/I_N(\hat{\gamma})}\\ &\frac{\hat{\gamma}-\gamma}{\hat{se}} \xrightarrow{d} N(0,1) \end{align*} $$ Coding the likelihood and the estimation routine based on our derivation is straightforward:
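Here is a sketch of the closed-form estimator and its plug-in standard error (the function name `mle_gamma` is mine; `D2` refers to the simulated second-period choices from the sketch earlier):

```julia
# Closed-form MLE of γ given δ and second-period choices d2 ∈ {0, 1},
# with the asymptotic standard error sqrt(1 / I_N(γ̂)).
function mle_gamma(d2, δ)
    N, S = length(d2), sum(d2)
    γ̂ = δ * S / (N - S)
    se = sqrt(γ̂ * (γ̂ + δ)^2 / (N * δ))
    return γ̂, se
end

γ̂, se = mle_gamma(D2, 3.0)   # δ = 3.0 was used to simulate D2 above
```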

The code below shows the estimation results for various sample sizes. I also include Optim.jl, a Julia package providing various optimization routines, to find the MLE numerically. As you can see, Optim.jl returns an identical result, as it should. Since it is impossible to solve analytically for the MLE as $T$ gets large in the finite-horizon case or in the infinite-horizon case, we will use Optim.jl in the next section.
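For reference, here is a sketch of how that numerical maximization might look with Optim.jl (a univariate bounded search over $\gamma$; the bracket and the use of `D2` are my illustrative choices):

```julia
using Optim

# Negative log-likelihood of γ given δ and second-period choices d2.
function negloglik(γ, d2, δ)
    S, N = sum(d2), length(d2)
    return -(S * (log(γ) - log(γ + δ)) + (N - S) * (log(δ) - log(γ + δ)))
end

δ = 3.0
res = optimize(γ -> negloglik(γ, D2, δ), 1e-4, 50.0)   # Brent's method on [1e-4, 50]
γ̂_optim = Optim.minimizer(res)
```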

Dynamic Problem: Infinite Horizon

Suppose now that individuals live forever. The lifetime utility is now $\sum_{t=1}^{\infty}\beta^{t-1}(d_t\mathbf{1} \{x_t=1\} + (1-d_t)w)$.

We consider the Bellman representation: $$ \begin{align*} V(\gamma,\delta,w)=\underset{d\in\{0,1\}}{\max}\; d \frac{\gamma}{\gamma+\delta} + (1-d)w + \beta \left(d\left(\frac{\gamma}{\gamma+\delta}V(\gamma+1,\delta,w)+\frac{\delta}{\gamma+\delta}V(\gamma,\delta+1,w)\right)+(1-d)V(\gamma,\delta,w)\right) \end{align*} $$ The following code shows value function iteration (VFI) and data simulation.

VFI
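Here is a sketch of a VFI routine on a truncated grid of reachable beliefs (the truncation size `M`, the boundary approximation, and all names are my own choices, not the assignment's):

```julia
# VFI over states (γ + i, δ + j) for 0 ≤ i, j ≤ M, i.e. all beliefs reachable from
# (γ, δ) after at most M successes and M failures. Beyond the boundary, the
# continuation value is approximated by committing forever to the better action.
function solve_vfi(γ, δ, w, β; M = 200, tol = 1e-10, maxiter = 10_000)
    commit(g, d) = max(g / (g + d), w) / (1 - β)
    # (value of inventing, value of the outside option) at state (γ + i, δ + j)
    function action_values(V, i, j)
        g, d = γ + i, δ + j
        p = g / (g + d)
        Vs = i < M ? V[i + 2, j + 1] : commit(g + 1, d)   # continuation after a success
        Vf = j < M ? V[i + 1, j + 2] : commit(g, d + 1)   # continuation after a failure
        return p + β * (p * Vs + (1 - p) * Vf), w + β * V[i + 1, j + 1]
    end
    V = zeros(M + 1, M + 1)        # V[i+1, j+1] ≈ V(γ + i, δ + j, w)
    for _ in 1:maxiter
        Vnew = [max(action_values(V, i, j)...) for i in 0:M, j in 0:M]
        Δ = maximum(abs.(Vnew .- V))
        V = Vnew
        Δ < tol && break
    end
    # Policy: true means invent at that state.
    policy = [first(action_values(V, i, j)) > last(action_values(V, i, j)) for i in 0:M, j in 0:M]
    return V, policy
end
```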

Data simulation

I set $\gamma=2.3, \delta=2.0, w=0.65, \beta=0.96, N=100000$ here for an illustration.
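A sketch of the simulation under these parameters, using the `solve_vfi` policy above (the function name `simulate_panel` and the horizon `T` are my own; I truncate the simulated panel at $T=5$ since that is all we use below):

```julia
using Distributions, Random

# Simulate N agents for T periods under the VFI policy. An agent stops inventing the
# first time the policy says so; no new information arrives after that.
function simulate_panel(N, T, γ, δ, w, β; rng = MersenneTwister(1))
    _, policy = solve_vfi(γ, δ, w, β)
    D = falses(N, T)                         # D[n, t] = 1 if agent n invents in period t
    for n in 1:N
        ξ = rand(rng, Beta(γ, δ))            # true ability, fixed over time
        i, j = 0, 0                          # accumulated successes and failures
        for t in 1:T
            policy[i + 1, j + 1] || break
            D[n, t] = true
            rand(rng) < ξ ? (i += 1) : (j += 1)
        end
    end
    return D
end

D = simulate_panel(100_000, 5, 2.3, 2.0, 0.65, 0.96)
```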

Let's take a look at the policy function and the value function we found via VFI.

The figures below show the fraction of agents still inventing at $t$ and the hazard rate at $t$.

Hazard Rate and MLE

Notation:

$$ \begin{align*} h_1(\gamma,\delta)=&\mathbb{P}(\text{The agent quits at }t=1)\\ =&\mathbb{E}(1-d(\gamma,\delta)) \end{align*} $$

We are going to generate the data so that everyone tries inventing at $t=1$, so $h_1(\gamma,\delta)=0$.

$$\begin{align*} h_2(\gamma,\delta)=&\mathbb{P}(\text{The agent quits at }t=2|\text{The agent invents until } t=1 )\\ =&\frac{\mathbb{P}(\text{The agent invents until } t=1 \text{ and quits at }t=2)}{\mathbb{P}(\text{The agent invents until } t=1 )} = \frac{\mathbb{P}(\text{The agent invents until } t=1 \text{ and quits at }t=2)}{1-h_1}\\ =&\frac{1}{1-h_1}\Bigg(\mathbb{P}(\text{S,Q}) + \mathbb{P}(\text{F,Q})\Bigg)\\ =&\frac{1}{1-h_1}\Bigg(\frac{\gamma}{\gamma+\delta}d(\gamma,\delta)\Big(1-d(\gamma+1,\delta)\Big)+\frac{\delta}{\gamma+\delta}d(\gamma,\delta)\Big(1-d(\gamma,\delta+1)\Big)\Bigg) \end{align*}$$
$$ \begin{align*} h_3(\gamma,\delta) =&\mathbb{P}(\text{The agent quits at }t=3|\text{The agent invents until } t=2)\\ =&\frac{\mathbb{P}(\text{The agent invents until } t=2 \text{ and quits at }t=3)}{\mathbb{P}(\text{The agent invents until } t=2 )} = \frac{\mathbb{P}(\text{The agent invents until } t=2 \text{ and quits at }t=3)}{(1-h_1)(1-h_2)}\\ =&\frac{1}{(1-h_1)(1-h_2)}\Bigg(\mathbb{P}(\text{S,S,Q})+\mathbb{P}(\text{S,F,Q})+\mathbb{P}(\text{F,S,Q})+\mathbb{P}(\text{F,F,Q})\Bigg) \\ =&\frac{1}{(1-h_1)(1-h_2)}\times\\ \Bigg(&\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}d(\gamma,\delta)d(\gamma+1,\delta)\Big(1-d(\gamma+2,\delta)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}d(\gamma,\delta)d(\gamma+1,\delta)\Big(1-d(\gamma+1,\delta+1)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}d(\gamma,\delta)d(\gamma,\delta+1)\Big(1-d(\gamma+1,\delta+1)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}d(\gamma,\delta)d(\gamma,\delta+1)\Big(1-d(\gamma,\delta+2)\Big)\Bigg) \end{align*} $$

Notice that at $t=3$, the proportion who tried until $t=2$ is $(1-h_1)(1-h_2)=1-h_2$ since $h_1=0$. Also, the terms inside represent the proportions of agents who survived until $t=2$ and quit at $t=3$, one for every possible history up to $t=2$. Directly enumerating all possible histories like this is feasible only because the states are discrete. Although the summation gets more complicated, let's take this approach up to $t=5$:

$$ \begin{align*} h_4(\gamma,\delta) =& \mathbb{P}(\text{The agent quits at }t=4|\text{The agent invents until }t=3)\\ =&\frac{\mathbb{P}(\text{The agent invents until }t=3\text{ and quits at }t=4)}{\mathbb{P}(\text{The agent invents until }t=3)} =\frac{\mathbb{P}(\text{The agent invents until }t=3\text{ and quits at }t=4)}{(1-h_1)(1-h_2)(1-h_3)}\\ =&\frac{1}{(1-h_1)(1-h_2)(1-h_3)}\times\\ \Bigg(&\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\gamma+2}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)\Big(1-d(\gamma+3,\delta)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\delta}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)\Big(1-d(\gamma+2,\delta+1)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)\Big(1-d(\gamma+2,\delta+1)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)\Big(1-d(\gamma+2,\delta+1)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\gamma}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)\Big(1-d(\gamma+1,\delta+2)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)\Big(1-d(\gamma+1,\delta+2)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)\Big(1-d(\gamma+1,\delta+2)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\delta+2}{\gamma+\delta+2}d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)\Big(1-d(\gamma,\delta+3)\Big)\Bigg) \end{align*} $$
$$ \begin{align*} h_5(\gamma,\delta) =& \mathbb{P}(\text{The agent quits at }t=5|\text{The agent invents until }t=4) \\ =&\frac{\mathbb{P}(\text{The agent invents until }t=4\text{ and quits at }t=5)}{\mathbb{P}(\text{The agent invents until }t=4)} = \frac{\mathbb{P}(\text{The agent invents until }t=4\text{ and quits at }t=5)}{(1-h_1)(1-h_2)(1-h_3)(1-h_4)}\\ =&\frac{1}{(1-h_1)(1-h_2)(1-h_3)(1-h_4)}\times\\ \Bigg(&\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\gamma+2}{\gamma+\delta+2}\frac{\gamma+3}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)d(\gamma+3,\delta)\Big(1-d(\gamma+4,\delta)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\gamma+2}{\gamma+\delta+2}\frac{\delta}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)d(\gamma+3,\delta)\Big(1-d(\gamma+3,\delta+1)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\delta}{\gamma+\delta+2}\frac{\gamma+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)d(\gamma+2,\delta+1)\Big(1-d(\gamma+3,\delta+1)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}\frac{\gamma+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)d(\gamma+2,\delta+1)\Big(1-d(\gamma+3,\delta+1)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}\frac{\gamma+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)d(\gamma+2,\delta+1)\Big(1-d(\gamma+3,\delta+1)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\gamma+1}{\gamma+\delta+1}\frac{\delta}{\gamma+\delta+2}\frac{\delta+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+2,\delta)d(\gamma+2,\delta+1)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}\frac{\delta+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)d(\gamma+2,\delta+1)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}\frac{\gamma+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)d(\gamma+1,\delta+2)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\gamma}{\gamma+\delta+2}\frac{\gamma+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)d(\gamma+1,\delta+2)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}\frac{\gamma+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)d(\gamma+1,\delta+2)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\gamma+1}{\gamma+\delta+2}\frac{\delta+1}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)d(\gamma+2,\delta+1)\Big(1-d(\gamma+2,\delta+2)\Big)+\\ &\frac{\gamma}{\gamma+\delta}\frac{\delta}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}\frac{\delta+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma+1,\delta)d(\gamma+1,\delta+1)d(\gamma+1,\delta+2)\Big(1-d(\gamma+1,\delta+3)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\gamma}{\gamma+\delta+1}\frac{\delta+1}{\gamma+\delta+2}\frac{\delta+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma+1,\delta+1)d(\gamma+1,\delta+2)\Big(1-d(\gamma+1,\delta+3)\Big)+\\ 
&\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\gamma}{\gamma+\delta+2}\frac{\delta+2}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)d(\gamma+1,\delta+2)\Big(1-d(\gamma+1,\delta+3)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\delta+2}{\gamma+\delta+2}\frac{\gamma}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)d(\gamma,\delta+3)\Big(1-d(\gamma+1,\delta+3)\Big)+\\ &\frac{\delta}{\gamma+\delta}\frac{\delta+1}{\gamma+\delta+1}\frac{\delta+2}{\gamma+\delta+2}\frac{\delta+3}{\gamma+\delta+3} d(\gamma,\delta)d(\gamma,\delta+1)d(\gamma,\delta+2)d(\gamma,\delta+3)\Big(1-d(\gamma,\delta+4)\Big)\Bigg) \end{align*} $$

Let's wrap this into a function and call it hazard:
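One way to implement it is to enumerate the success/failure histories directly, which stays cheap for small $t$ (a sketch; it assumes a `policy(γ, δ)` function returning the agent's decision at a belief state, e.g. a lookup into the VFI policy above):

```julia
# Conditional hazard h_τ(γ, δ): probability of quitting at τ given inventing up to τ - 1.
# Enumerates every success/failure history of length τ - 1.
function hazard(τ, γ, δ, policy)
    τ == 1 && return 1.0 - policy(γ, δ)
    quit = 0.0       # P(invent for τ - 1 periods and quit at τ)
    survive = 0.0    # P(invent for τ - 1 periods)
    for hist in Iterators.product(ntuple(_ -> (0, 1), τ - 1)...)
        g, d, p, invents = γ, δ, 1.0, true
        for x in hist
            invents = invents && policy(g, d) == 1       # must choose to invent
            p *= x == 1 ? g / (g + d) : d / (g + d)      # probability of this outcome
            g += x
            d += 1 - x
        end
        invents || continue
        survive += p
        quit += p * (1 - policy(g, d))                   # quits at τ
    end
    return survive > 0 ? quit / survive : 0.0
end
```

For instance, with the VFI policy matrix `pol` from `solve_vfi`, one could pass `(g, d) -> pol[round(Int, g - γ) + 1, round(Int, d - δ) + 1]` as `policy`.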

Now we are ready to use these hazard rates and do MLE like in the two-period model. The sample comprises a cross-section of spells $i\in\{1,\ldots,N\}$, some of which are completed at $\tau_i$ and some of which are incomplete, lasting at least $T$ periods. Let $p_{\tau_i}(\gamma;\delta)$ denote the unconditional probability that individual $i$ with parameters $(\gamma,\delta)$ invents for $\tau_i-1$ periods and stops inventing at $\tau_i$ if the spell is complete, and the unconditional probability that individual $i$ invents for at least $T$ periods if the spell is incomplete:

$$ p_{\tau_i}(\gamma;\delta) := \begin{cases} h_{\tau_i}(\gamma,\delta)\prod_{s=1}^{\tau_i-1}(1-h_s(\gamma,\delta)) &\text{ if the spell is complete}\\ \prod_{s=1}^{T}(1-h_s(\gamma,\delta)) & \text{ if the spell is incomplete} \end{cases} $$

The likelihood is then: $$\begin{align*} \mathcal{L}&=\prod_{i=1}^{N}p_{\tau_i}(\gamma;\delta)\\ \log\mathcal{L}&=\sum_{i=1}^{N}\log p_{\tau_i}(\gamma;\delta) \end{align*}$$

While we are playing with this model, we can think about this question: how much do our MLE estimates improve as i) N increases and ii) T increases in our data? If we have more information about what agents do in the future, can we estimate our parameter better? In order to see this, I will form the log-likelihood supposing that we have data up to $t=2,3,4,5$.
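Here is a sketch of that log-likelihood and its numerical maximization over $\gamma$ (it reuses the hypothetical `hazard`, `solve_vfi`, and simulated panel `D` from above, holding $\delta$, $w$, and $\beta$ at their true values; the search bracket is arbitrary):

```julia
using Optim

# Log-likelihood of stopping times τs (τ > T means "still inventing at T"), built from
# the model-implied hazards h_1, ..., h_T at a candidate γ.
function spell_loglik(γ, τs, T, δ, w, β)
    _, pol = solve_vfi(γ, δ, w, β)
    policy(g, d) = pol[round(Int, g - γ) + 1, round(Int, d - δ) + 1]
    h = [hazard(t, γ, δ, policy) for t in 1:T]
    logsurv = cumsum(log.(1 .- h))              # log ∏_{s ≤ t} (1 - h_s)
    ll = 0.0
    for τ in τs
        if τ > T                                 # incomplete spell
            ll += logsurv[T]
        else                                     # spell completed at τ
            ll += log(h[τ]) + (τ > 1 ? logsurv[τ - 1] : 0.0)
        end
    end
    return ll
end

# Stopping time for each agent: first period without inventing, or T + 1 if censored.
T = size(D, 2)
τs = [something(findfirst(!, view(D, n, :)), T + 1) for n in 1:size(D, 1)]

res = optimize(γ -> -spell_loglik(γ, τs, T, 2.0, 0.65, 0.96), 1.0, 5.0)
γ̂ = Optim.minimizer(res)
```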

As $N$ grows, we see that our empirical hazard rates approach their theoretical counterparts, as they should. The table of estimation results shows that i) holding the available information across time constant, the MLE estimates tend to the true value as the number of observations increases, and ii) holding the number of observations constant, using more information on the agents' choices across time improves efficiency. It is also interesting to see that using information up to $t=3$ does not improve the estimates at all compared to using information up to $t=2$. This is because no one quits at $t=3$; thus, there is no additional information to use for our estimation there.

Appendix: Sanity check of the simulation for the infinite horizon model