# Interface definition with three fields. Each field is declared on its own
# line as `type name`, which is the layout the ROS interface format expects.

# Variable-length array of 64-bit floating-point values.
# NOTE(review): presumably model/policy parameters; confirm with the producer.
float64[] weights

# Unsigned 16-bit integer (range 0..65535).
# NOTE(review): looks like the index of the last step of a run; confirm
# whether it is 0- or 1-based and that 65535 is a sufficient upper bound.
uint16 final_step

# 64-bit floating-point value.
# NOTE(review): presumably the reward associated with the run; confirm whether
# it is cumulative or the value at final_step.
float64 reward