--- reinforcement_learning/reinforce.py.orig 2025-02-09 16:56:58 UTC +++ reinforcement_learning/reinforce.py @@ -9,6 +9,9 @@ from torch.distributions import Categorical import torch.optim as optim from torch.distributions import Categorical +# numpy.bool8 was deprecated in NumPy 1.24.0 and removed in 2.0; restore the alias when it is missing +if not hasattr(np, 'bool8'): + np.bool8 = np.bool_ parser = argparse.ArgumentParser(description='PyTorch REINFORCE example') parser.add_argument('--gamma', type=float, default=0.99, metavar='G',