diff --git a/open_spiel/python/pytorch/dqn.py b/open_spiel/python/pytorch/dqn.py index 7b5bc775e9..0bb2bb6657 100644 --- a/open_spiel/python/pytorch/dqn.py +++ b/open_spiel/python/pytorch/dqn.py @@ -16,7 +16,6 @@ import collections import math -import sys import numpy as np from scipy import stats import torch @@ -30,7 +29,7 @@ "Transition", "info_state action reward next_info_state is_final_step legal_actions_mask") -ILLEGAL_ACTION_LOGITS_PENALTY = sys.float_info.min +ILLEGAL_ACTION_LOGITS_PENALTY = torch.finfo(torch.float).min class SonnetLinear(nn.Module):