danstowell · July 28, 2022 06:44
diff --git a/bootstrap_example.py b/bootstrap_example.py
 # example of bootstrap sampling to estimate confidence intervals on an accuracy measure

 import numpy as np


 # Number of bootstrap resamples: 500 for final evaluation (50 is quick enough while developing).
 nbootstraps = 500

 # A deliberately tiny set of outcomes: 1 means sound X was predicted correctly, 0 means it was not.
 outcomes = np.array([1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0])


 # Fix the seed so the same resampling index arrays are produced on every run.
 np.random.seed(1234)
 # One index array per resample, each as long as `outcomes`; indices may repeat within an array.
 bootstrappers = [
     np.random.randint(0, len(outcomes), size=len(outcomes), dtype=int)
     for _ in range(nbootstraps)
 ]

 # Accuracy on the real data, followed by the accuracy of every resampled copy.
 accuracy = outcomes.mean()
 boo_accuracies = [outcomes[resample_idx].mean() for resample_idx in bootstrappers]

 # The 2.5th and 97.5th percentiles of the resampled accuracies bound the reported interval.
 accuracy_lo = np.percentile(boo_accuracies, 2.5)
 accuracy_hi = np.percentile(boo_accuracies, 97.5)


 print(f"For {len(outcomes)} outcomes, the accuracy is {accuracy}, confidence interval [{accuracy_lo}, {accuracy_hi}]")
	# example of bootstrap sampling to estimate confidence intervals on an accuracy measure

	import numpy as np


	# Number of bootstrap resamples: 50 is fast enough for development, 500 is used for final evaluation.
	nbootstraps = 500

	# here's a VERY SHORT list of outcomes, each one reflecting whether sound X was correctly predicted or not
	outcomes = np.array([1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0])


	# Generate the indexing arrays for bootstrap sampling. The seed is fixed so
	# that repeated runs draw the same resamples.
	np.random.seed(1234)
	bootstrappers = [
		np.random.randint(0, len(outcomes), len(outcomes), int)
		for _ in range(nbootstraps)
	]

	# Accuracy of the observed outcomes.
	accuracy = np.mean(outcomes)
	# Accuracy of each resample. This is written as a comprehension because the
	# original loop body was not indented under its `for`, which is a syntax error.
	boo_accuracies = [np.mean(outcomes[bootstrapper]) for bootstrapper in bootstrappers]

	# Lower and upper bounds: the 2.5th and 97.5th percentiles of the resampled accuracies.
	accuracy_lo = np.percentile(boo_accuracies, 2.5)
	accuracy_hi = np.percentile(boo_accuracies, 97.5)


	print(f"For {len(outcomes)} outcomes, the accuracy is {accuracy}, confidence interval [{accuracy_lo}, {accuracy_hi}]")
No results found