# -*- coding: utf-8 -*- """ Created on Fri May 6 13:22:05 2022 @author: turinici """ import numpy as np import matplotlib.pyplot as plt from tqdm import tqdm k,T,M,epsilon=10,1000,2000,0.1 rewards= np.zeros((T,M)) qstar_vec=np.zeros((k,M)) for m in tqdm(range(M)): qstar = np.random.randn(k) qstar_vec[:,m]=qstar count_vector=np.zeros(k) Q=np.zeros(k) for t in range(T): x = np.random.rand() if(x