(** Class specification for [q_learner].

    The class takes two type parameters: ['a], the element type of
    [actions] and the result type of [get_action]; and ['b], the type of
    [current_state] and of the first argument of [percieve_result].

    The constructor takes an ['a list] and a ['b] value.
    NOTE(review): presumably the available actions and the initial state;
    confirm against the implementation. *)
class ['a, 'b] q_learner : 'a list -> 'b -> object

  (** Pairs of a ['b] value and an integer.
      NOTE(review): presumably maps each known state to an index; confirm. *)
  val mutable states : ('b * int) list

  (** Integer counter.
      NOTE(review): presumably the number of entries in [states]; confirm. *)
  val mutable num_states : int

  (** Immutable array of ['a] values. *)
  val actions : 'a array

  (** Immutable integer.
      NOTE(review): presumably the length of [actions]; confirm. *)
  val num_actions : int

  (** Pairs of a ['b] value and a float array.
      NOTE(review): presumably one float per action for each state; confirm. *)
  val mutable q_table : ('b * float array) list

  (** A mutable value of the state type ['b]. *)
  val mutable current_state : 'b

  (** Mutable integer.
      NOTE(review): presumably an index into [actions]; confirm. *)
  val mutable last_action : int

  (** Mutable float parameters. Their meaning is not visible in this
      signature; see the implementation. *)
  val mutable delta : float
  val mutable alpha : float
  val mutable beta : float

  (** Private helper returning an integer.
      NOTE(review): presumably the index of the preferred action; confirm. *)
  method private get_best_action : unit -> int

  (** Returns a value of the action type ['a]. *)
  method get_action : unit -> 'a

  (** Takes a ['b] value and a float, and returns unit.
      NOTE(review): presumably the observed next state and its reward;
      confirm. The spelling "percieve" is part of the public interface and
      is kept as-is so existing callers continue to compile. *)
  method percieve_result : 'b -> float -> unit
end