def upper_bound(self, t):
    """Return the optimistic score ``mean + radius`` for each entry.

    The score is computed as::

        success / trials + sqrt(alpha * log(t) / (2 * trials))

    Entries whose trial count is zero have no defined mean (0/0), so
    they are assigned ``+inf`` instead of the NaN the raw formula would
    produce; this keeps the result usable in comparisons and ``argmax``.

    Args:
        t: Value passed to ``np.log``; presumably the current round
            number (TODO confirm against caller). Values below 1 make
            the logarithm negative and the radius NaN.

    Returns:
        ``mean + radius`` with the broadcast shape of ``self.success``,
        ``self.trials`` and ``t``; ``+inf`` where ``self.trials == 0``.
        A NumPy scalar is returned when all inputs are scalars.
    """
    trials = np.asarray(self.trials)
    untried = trials == 0
    # Use a placeholder count of 1 for untried entries so the divisions
    # below never hit zero; those positions are overwritten with +inf.
    safe_trials = np.where(untried, 1, trials)

    mu = np.true_divide(self.success, safe_trials)
    interval = np.sqrt(self.alpha * np.log(t) / (2.0 * safe_trials))

    # Indexing with () turns a 0-d result back into a scalar and leaves
    # n-d arrays untouched, matching the original return type.
    return np.where(untried, np.inf, mu + interval)[()]