# Per-step residuals: delta_t = r_t + gamma * (1 - done_t) * next_value_t - value_t.
# (This has the shape of a one-step temporal-difference error; `1 - done_t`
# zeroes the bootstrap term on steps where done_t is 1/True.)
#
# The plain list-comprehension form of this line was observed to fail with:
#   TypeError: unsupported operand type(s) for +: 'NoneType' and 'float'
# `r` is the left operand of the first `+`, so that error means an entry of
# `rewards` was None. The check below keeps the same exception type but reports
# which sequence and which timestep hold the None, so the upstream source of
# the missing value can be found. None is deliberately NOT coerced to 0.0:
# that would silently hide a data-collection bug.
#
# NOTE: zip() stops at the shortest input, so mismatched lengths are truncated
# silently, exactly as in the original expression.
_field_names = ("rewards", "dones", "next_values", "values")
deltas = []
for _step, _row in enumerate(zip(rewards, dones, next_values, values)):
    for _field, _item in zip(_field_names, _row):
        if _item is None:
            raise TypeError(
                f"{_field}[{_step}] is None; cannot compute delta for this step"
            )
    _reward, _done, _next_value, _value = _row
    deltas.append(_reward + gamma * (1 - _done) * _next_value - _value)