flat_test.py

execfile("core.py")
import matplotlib.pyplot as plt
from datetime import datetime
random.seed(datetime.now())


def test1(num_sims, Klist, algo):
    # algo = Racing or LUCB
    if algo == Racing:
        beta = beta_racing
    elif algo == LUCB:
        beta = beta_LUCB
    else:
        print "Wrong algorithm input."
    horizons_mean = np.zeros((len(Klist), 2))
    for kid, k in enumerate(Klist):
        print kid
        m = k/5
        eps = 0.1
        delta = 0.1
        horizons = np.zeros((num_sims,2), dtype=int)
        for sim in range(num_sims):
            means = np.random.random(k)
            arms = map(lambda (mu): BernoulliArm(mu), means)
            caseH = algo(arms, m, eps, delta, beta, Hoeffding)
            caseH.run()
            caseC = algo(arms, m, eps, delta, beta, Chernoff)
            caseC.run()
            horizons[sim,0] = caseH.N
            horizons[sim,1] = caseC.N
            print sim
        horizons_mean[kid] = np.mean(horizons, axis=0)
    return horizons_mean

def test23_LUCB(algo, num_sims, check_points, true_bestarms):
    num_points = len(check_points)
    horizons = np.zeros(num_sims)
    checkpoints = np.zeros((num_sims, num_points), dtype=int)
    checkerrors = np.zeros((num_sims, num_points), dtype=bool)
    for sim in range(num_sims):
        print sim
        algo.initialize()
        algo.set_checkpoints(check_points, true_bestarms)
        algo.run()
        horizons[sim] = algo.N
        checkpoints[sim] = algo.checkpoints
        checkerrors[sim] = algo.checkerrors
    return horizons, checkpoints, checkerrors


## test 1
print "test 1"
num_sims = 10
Klist = range(10,61,10)
horizons_mean_racing = test1(num_sims, Klist, Racing)
horizons_mean_LUCB = test1(num_sims, Klist, LUCB)

# plot test 1
fig = plt.figure()
plt.plot(Klist, horizons_mean_racing[:,0]/10000, 'ko-', label='Racing')
plt.plot(Klist, horizons_mean_racing[:,1]/10000, 'bo-', label='KL-Racing')
plt.plot(Klist, horizons_mean_LUCB[:,0]/10000, 'g^-', label='LUCB')
plt.plot(Klist, horizons_mean_LUCB[:,1]/10000, 'y^-', label='KL-LUCB')
plt.legend(loc='best')
plt.title('Expected sample complexity / 10000')
plt.xlabel('K')
plt.savefig('figure/flat_test1.png', bbox_inches='tight')
plt.close(fig)


## test23
print "test 23"
num_sims = 10
# B1
K = 15
means = np.array([0.5] + map(lambda (a): 0.5-a/40., range(2,K+1)))
n_arms = len(means)
arms = map(lambda (mu): BernoulliArm(mu), means)

m = 3
eps = 0.04
delta = 0.1
caseH_racing = Racing(arms, m, eps, delta, beta_racing, Hoeffding)
caseC_racing = Racing(arms, m, eps, delta, beta_racing, Chernoff)
caseH_LUCB = LUCB(arms, m, eps, delta, beta_lucb, Hoeffding)
caseC_LUCB = LUCB(arms, m, eps, delta, beta_LUCB, Chernoff)
checkpoints = np.arange(1000, 7001, 1000)
true_best_arms = set([0,1,2])
horizonsH1_racing, checkpointsH1_racing, checkerrorsH1_racing = test23(caseH_racing, num_sims, checkpoints, true_best_arms)
horizonsC1_racing, checkpointsC1_racing, checkerrorsC1_racing = test23(caseC_racing, num_sims, checkpoints, true_best_arms)
horizonsH1_LUCB, checkpointsH1_LUCB, checkerrorsH1_LUCB = test23_LUCB(caseH_LUCB, num_sims, checkpoints, true_best_arms)
horizonsC1_LUCB, checkpointsC1_LUCB, checkerrorsC1_LUCB = test23_LUCB(caseC_LUCB, num_sims, checkpoints, true_best_arms)
errorrateH1_racing = np.sum(checkerrorsH1_racing, axis=0)/float(num_sims)
errorrateC1_racing = np.sum(checkerrorsC1_racing, axis=0)/float(num_sims)
errorrateH1_LUCB = np.sum(checkerrorsH1_LUCB, axis=0)/float(num_sims)
errorrateC1_LUCB = np.sum(checkerrorsC1_LUCB, axis=0)/float(num_sims)

# B2
means /= 2
arms = map(lambda (mu): BernoulliArm(mu), means)

m = 3
eps = 0.02
delta = 0.1
caseH_racing = Racing(arms, m, eps, delta, beta_racing, Hoeffding)
caseC_racing = Racing(arms, m, eps, delta, beta_racing, Chernoff)
caseH_LUCB = LUCB(arms, m, eps, delta, beta_LUCB, Hoeffding)
caseC_LUCB = LUCB(arms, m, eps, delta, beta_LUCB, Chernoff)
horizonsH2_racing, checkpointsH2_racing, checkerrorsH2_racing = test23(caseH_racing, num_sims, checkpoints, true_best_arms)
horizonsC2_racing, checkpointsC2_racing, checkerrorsC2_racing = test23(caseC_racing, num_sims, checkpoints, true_best_arms)
horizonsH2_LUCB, checkpointsH2_LUCB, checkerrorsH2_LUCB = test23_LUCB(caseH_LUCB, num_sims, checkpoints, true_best_arms)
horizonsC2_LUCB, checkpointsC2_LUCB, checkerrorsC2_LUCB = test23_LUCB(caseC_LUCB, num_sims, checkpoints, true_best_arms)
errorrateH2_racing = np.sum(checkerrorsH2_racing, axis=0)/float(num_sims)
errorrateC2_racing = np.sum(checkerrorsC2_racing, axis=0)/float(num_sims)
errorrateH2_LUCB = np.sum(checkerrorsH2_LUCB, axis=0)/float(num_sims)
errorrateC2_LUCB = np.sum(checkerrorsC2_LUCB, axis=0)/float(num_sims)

# plot test 2
fig = plt.figure()
plt.subplot(2, 1, 1)
plt.hist(horizonsH1_racing/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='red', align='mid', label='Racing')
plt.hist(horizonsC1_racing/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='green', align='mid', label='KL-Racing')
plt.hist(horizonsH1_LUCB/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='yellow', align='mid', label='LUCB')
plt.hist(horizonsC1_LUCB/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='blue', align='mid', label='KL-LUCB')
plt.legend(loc='best')
plt.title('Fraction of runs (in bins of width 1000)')
plt.subplot(2, 1, 2)
plt.hist(horizonsH2_racing/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='red', align='mid', label='Racing')
plt.hist(horizonsC2_racing/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='green', align='mid', label='KL-Racing')
plt.hist(horizonsH2_LUCB/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='yellow', align='mid', label='LUCB')
plt.hist(horizonsC2_LUCB/10000, bins=num_sims/10, range=[2.,22.], normed=True, facecolor='blue', align='mid', label='KL-LUCB')
plt.legend(loc='best')
plt.xlabel('Samples / 10000')
plt.savefig('figure/flat_test2.png', bbox_inches='tight')
plt.close(fig)

# plot test 3
fig = plt.figure()
plt.plot(checkpoints/1000, errorrateH1_racing, 'ko-', label='Racing')
plt.plot(checkpoints/1000, errorrateC1_racing, 'bo-', label='KL-Racing')
plt.plot(checkpoints/1000, errorrateH1_LUCB, 'g^-', label='LUCB')
plt.plot(checkpoints/1000, errorrateC1_LUCB, 'y^-', label='KL-LUCB')
plt.legend(loc='best')
plt.title('Empirical mistake probability during run')
plt.xlabel('Samples / 1000')
plt.savefig('figure/flat_test3.png', bbox_inches='tight')
plt.close(fig)