
function pull_arm!(Dist::String, arm::Int64, pull_times::Int64,marms::AbstractVector, npulls::AbstractVector, true_mean::AbstractVector)
    npulls[arm] += pull_times
    ta = true_mean[arm]
    if Dist == "Normal"
        reward = sum(rand(Normal(ta, 0.2), pull_times))
    elseif Dist == "Bernoulli"
        reward = sum(rand(Bernoulli(ta), pull_times))
    elseif Dist == "Poisson"
        reward = sum(rand(Poisson(ta), pull_times))
    elseif Dist == "Power"
        reward = sum(rand(Kumaraswamy(1/(1/ta - 1), 1),pull_times))
    elseif Dist == "Exponential"
        reward = sum(rand(Exponential(ta), pull_times))
    elseif Dist == "Deterministic"
        reward = ta*pull_times
    end
    marms[arm] += reward
    return marms, npulls
end

function pull_arm!(Dist::String, arms::Vector{Int64}, pull_times::Int64,marms::AbstractVector, npulls::AbstractVector, true_mean::AbstractVector)
    npulls[arms] .+= pull_times
    for arm in arms
        ta = true_mean[arm]
        if Dist == "Normal"
            reward = sum(rand(Normal(ta, 0.2), pull_times))
        elseif Dist == "Bernoulli"
            reward = sum(rand(Bernoulli(ta), pull_times))
        elseif Dist == "Poisson"
            reward = sum(rand(Poisson(ta), pull_times))
        elseif Dist == "Power"
            reward = sum(rand(Kumaraswamy(1/(1/ta - 1), 1),pull_times))
        elseif Dist == "Exponential"
            reward = sum(rand(Exponential(ta), pull_times))
        elseif Dist == "Deterministic"
            reward = ta*pull_times
        end
        marms[arm] += reward
    end
    return marms, npulls
end

function pull_arm!(Dist::String, arm::Arm; pull_times::Int = 1) ## For BSH
    if Dist == "Normal"
        reward = sum(rand(Normal(arm.avg_reward, 0.2), pull_times))
    elseif Dist == "Bernoulli"
        reward = sum(rand(Bernoulli(arm.avg_reward), pull_times))
    elseif Dist == "Poisson"
        reward = sum(rand(Poisson(arm.avg_reward), pull_times))
    elseif Dist == "Power"
        reward = sum(rand(Kumaraswamy(1/(1/arm.avg_reward - 1), 1),pull_times))
    elseif Dist == "Exponential"
        reward = sum(rand(Exponential(arm.avg_reward), pull_times))
    elseif Dist == "Deterministic"
        reward = arm.avg_reward*pull_times
    end
    arm.eprc_reward = (arm.eprc_reward * arm.num_pulls + reward) / (arm.num_pulls + pull_times)
    arm.num_pulls += pull_times
end
