"""Generate the hyper-parameter grid-search configs for the auto_bomber agent.

Reads ``default_hyper_parameters.json``, overrides the searched
hyper-parameters for every grid point and writes one JSON file per point
into a ``stable/`` sub-directory.
"""
import itertools
import json
from pathlib import Path

# Wider candidate grid, currently disabled:
# EPSILONS = [0.15, 0.25, 0.35]
# DISCOUNTS = [0.35, 0.5, 0.65, 0.85, 0.95]
# LRS = [0.006, 0.0003, 0.00006, 0.00001, 0.000006]
# POLICIES = ['SOFTMAX', 'IANN']
# TEMPERATURES = [0.3, 0.5, 0.7, 0.9]

EPSILONS = [0.25]
DISCOUNTS = [0.4, 0.7, 0.9]
LRS = [0.006, 0.0003, 0.00009, 0.00001]
POLICIES = ['SOFTMAX', 'IANN']
TEMPERATURES = [0.4, 0.7, 0.9]


def _grid(policy):
    """Yield ``(file_name, overrides)`` for every grid point of *policy*.

    ``overrides`` lists the keys in the order they are applied to the
    defaults.  ``epsilon`` is only searched (and only appears in the file
    name) for the ``IANN`` policy.  Policies other than ``SOFTMAX`` and
    ``IANN`` yield nothing.
    """
    if policy == 'SOFTMAX':
        for temp, discount, lr in itertools.product(TEMPERATURES, DISCOUNTS, LRS):
            file_name = f"stable_{policy}_temp{temp}_disc{discount}_lr{lr}.json"
            yield file_name, {
                'discount': discount,
                'learning_rate': lr,
                'policy': policy,
                'temperature': temp,
            }
    elif policy == 'IANN':
        for eps, temp, discount, lr in itertools.product(
                EPSILONS, TEMPERATURES, DISCOUNTS, LRS):
            file_name = f"stable_{policy}_eps{eps}_temp{temp}_disc{discount}_lr{lr}.json"
            yield file_name, {
                'epsilon': eps,
                'discount': discount,
                'learning_rate': lr,
                'policy': policy,
                'temperature': temp,
            }


def main(base_dir='.'):
    """Write one config file per grid point and return the written paths.

    Args:
        base_dir: Directory that contains ``default_hyper_parameters.json``
            and receives the ``stable/`` output directory.  Defaults to the
            current working directory.

    Returns:
        The list of ``Path`` objects written, in generation order.

    Raises:
        FileNotFoundError: If the default hyper-parameter file is missing.
    """
    base = Path(base_dir)
    with open(base / 'default_hyper_parameters.json', encoding='utf-8') as src:
        defaults = json.load(src)

    # Create the output directory up front so a fresh checkout works.
    out_dir = base / 'stable'
    out_dir.mkdir(parents=True, exist_ok=True)

    written = []
    for policy in POLICIES:
        for file_name, overrides in _grid(policy):
            # Build a fresh dict per grid point: the loaded defaults are never
            # mutated, so no value can leak from one config into the next.
            config = {**defaults, **overrides}
            target = out_dir / file_name
            with open(target, 'w', encoding='utf-8') as dst:
                json.dump(config, dst)
            written.append(target)
    return written


if __name__ == '__main__':
    main()
b/agent_code/auto_bomber/configs/default_hyper_parameters.json @@ -0,0 +1,29 @@ +{ + "actions": [ + "UP", + "RIGHT", + "DOWN", + "LEFT", + "WAIT", + "BOMB" + ], + "epsilon": 0.25, + "discount": 0.85, + "learning_rate": 0.00009, + "policy": "SOFTMAX", + "temperature": 0.7, + "region_size": 2, + "region_time_tolerance": 6, + "game_rewards": { + "CRATE_DESTROYED": 70, + "COIN_FOUND": 30, + "COIN_COLLECTED": 70, + "KILLED_OPPONENT": 150, + "INVALID_ACTION": -100, + "KILLED_SELF": -150, + "GOT_KILLED": -50, + "SURVIVED_ROUND": 10, + "WAITED": -5, + "BOMB_DROPPED": 15 + } +} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json new file mode 100644 index 000000000..3e2a4f1c8 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json new file mode 100644 index 000000000..ed044a761 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 
6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json new file mode 100644 index 000000000..8250ae596 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json new file mode 100644 index 000000000..78083f93b --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json new file mode 100644 index 000000000..0e9013700 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json new file mode 100644 index 000000000..a93810631 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json new file mode 100644 index 000000000..b8c1cc83c --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json @@ 
-0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json new file mode 100644 index 000000000..abc4a2ac7 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json new file mode 100644 index 000000000..fc4f0085d --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, 
"KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json new file mode 100644 index 000000000..85abcc16e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json new file mode 100644 index 000000000..b64a9983e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json new file mode 100644 index 
000000000..02a2dbc8a --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json new file mode 100644 index 000000000..f845fb735 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json new file mode 100644 index 000000000..e91841c30 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 
6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json new file mode 100644 index 000000000..848d7ba20 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json new file mode 100644 index 000000000..7f0350d49 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json new file mode 100644 index 000000000..1df50827e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json new file mode 100644 index 000000000..91fc34c86 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json new file mode 100644 index 000000000..6a4e373ba --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json @@ 
-0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json new file mode 100644 index 000000000..438bba24e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json new file mode 100644 index 000000000..cde2fdffd --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, 
"KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json new file mode 100644 index 000000000..935a68ed0 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json new file mode 100644 index 000000000..f0c867da4 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json new file mode 100644 index 
000000000..3ecae7cd7 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json new file mode 100644 index 000000000..c71e4734b --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json new file mode 100644 index 000000000..8ea7172d6 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 
6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json new file mode 100644 index 000000000..75a6e685f --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json new file mode 100644 index 000000000..c3a5f542e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json new file mode 100644 index 000000000..24dd4c30a --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json new file mode 100644 index 000000000..15c9d5e74 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json new file mode 100644 index 000000000..7911a6130 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json @@ 
-0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json new file mode 100644 index 000000000..f4300ff0a --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json new file mode 100644 index 000000000..73007ec20 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, 
"KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json new file mode 100644 index 000000000..5ba769158 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json new file mode 100644 index 000000000..aa19380ac --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json new file mode 100644 index 
000000000..4ad70c444 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.0003.json new file mode 100644 index 000000000..b7de1c2ab --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.006.json new file mode 100644 index 000000000..41b8096d4 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": 
{"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr1e-05.json new file mode 100644 index 000000000..e28d0810e --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr9e-05.json new file mode 100644 index 000000000..9916eec9d --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.0003.json 
b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.0003.json new file mode 100644 index 000000000..195ffed73 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.006.json new file mode 100644 index 000000000..5e4ed5765 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr1e-05.json new file mode 100644 index 000000000..ab1042124 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 
1e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr9e-05.json new file mode 100644 index 000000000..7caa5422b --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.0003.json new file mode 100644 index 000000000..5cd361236 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.006.json new file mode 100644 index 000000000..8548f3e2b --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr1e-05.json new file mode 100644 index 000000000..344061cb1 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr9e-05.json new file mode 100644 index 000000000..348e35434 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.4_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", 
"DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.0003.json new file mode 100644 index 000000000..e0a6e407d --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.006.json new file mode 100644 index 000000000..7f58db255 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, 
"WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr1e-05.json new file mode 100644 index 000000000..227b4fa58 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr9e-05.json new file mode 100644 index 000000000..a2aea418d --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.0003.json new file mode 100644 index 000000000..48c28d0dd --- /dev/null +++ 
b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.006.json new file mode 100644 index 000000000..12bd715c1 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr1e-05.json new file mode 100644 index 000000000..fb3dfe40b --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, 
"COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr9e-05.json new file mode 100644 index 000000000..6aec9f6c3 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.0003.json new file mode 100644 index 000000000..e0e50e888 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.006.json 
b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.006.json new file mode 100644 index 000000000..3800ecc0c --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr1e-05.json new file mode 100644 index 000000000..77dd7215c --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr9e-05.json new file mode 100644 index 000000000..1f29fcbff --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.7_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, 
"policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.0003.json new file mode 100644 index 000000000..572ce81e1 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.006.json new file mode 100644 index 000000000..a3398bded --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr1e-05.json new file mode 100644 index 000000000..14cceb463 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr9e-05.json new file mode 100644 index 000000000..8ee7f7883 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.0003.json new file mode 100644 index 000000000..6004d1157 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", 
"DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.006.json new file mode 100644 index 000000000..97b85c511 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr1e-05.json new file mode 100644 index 000000000..17cafe20d --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, 
"WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr9e-05.json new file mode 100644 index 000000000..d772c6d0c --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.0003.json new file mode 100644 index 000000000..8538263d9 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.006.json new file mode 100644 index 000000000..b68ba9e26 --- /dev/null +++ 
b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr1e-05.json new file mode 100644 index 000000000..5a96c5bad --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, "COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr9e-05.json new file mode 100644 index 000000000..88ef3f776 --- /dev/null +++ b/agent_code/auto_bomber/configs/interesting/beta_SOFTMAX_temp0.9_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 40, "COIN_FOUND": 20, 
"COIN_COLLECTED": 50, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 80, "WAITED": -5, "BOMB_DROPPED": 10}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json new file mode 100644 index 000000000..1a1a2a197 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json new file mode 100644 index 000000000..e557d13d1 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json 
b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json new file mode 100644 index 000000000..f8d972fa1 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json new file mode 100644 index 000000000..0c4f196f7 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json new file mode 100644 index 000000000..f50f4a42b --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, 
"learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json new file mode 100644 index 000000000..415166cfd --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json new file mode 100644 index 000000000..9a16451af --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff 
--git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json new file mode 100644 index 000000000..94dcb8978 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json new file mode 100644 index 000000000..97c2451e5 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json new file mode 100644 index 000000000..2e525deb2 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": 
["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json new file mode 100644 index 000000000..3829ce658 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json new file mode 100644 index 000000000..b7dad9111 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.4_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, 
"SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json new file mode 100644 index 000000000..62d188bbb --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json new file mode 100644 index 000000000..b2a560020 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json new file mode 100644 index 000000000..452eaa3be --- /dev/null +++ 
b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json new file mode 100644 index 000000000..41e36265c --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json new file mode 100644 index 000000000..1dbf12914 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, 
"COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json new file mode 100644 index 000000000..b9191d6a4 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json new file mode 100644 index 000000000..1a7c96c5f --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json 
b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json new file mode 100644 index 000000000..8e73e61c5 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json new file mode 100644 index 000000000..0a4e03a91 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json new file mode 100644 index 000000000..450f49a4f --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, 
"learning_rate": 0.006, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json new file mode 100644 index 000000000..96ca5cd77 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json new file mode 100644 index 000000000..430802f5f --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.7_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff 
--git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json new file mode 100644 index 000000000..9c97527dd --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json new file mode 100644 index 000000000..a861e099e --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json new file mode 100644 index 000000000..12a71fd2e --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": 
["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json new file mode 100644 index 000000000..9cdde96c4 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json new file mode 100644 index 000000000..db0156963 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, 
"SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json new file mode 100644 index 000000000..60da1aaf4 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json new file mode 100644 index 000000000..12fc4ec67 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json new file mode 100644 index 000000000..d0d0685fd --- /dev/null +++ 
b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json new file mode 100644 index 000000000..96a90f617 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json new file mode 100644 index 000000000..1f80add38 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, 
"COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json new file mode 100644 index 000000000..73543d114 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json new file mode 100644 index 000000000..a1fe2982d --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_IANN_eps0.25_temp0.9_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "IANN", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.0003.json 
b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.0003.json new file mode 100644 index 000000000..d5c9f9e35 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.006.json new file mode 100644 index 000000000..59f0caea8 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr1e-05.json new file mode 100644 index 000000000..59b11766e --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", 
"temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr9e-05.json new file mode 100644 index 000000000..108ecb429 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.0003.json new file mode 100644 index 000000000..3f6ffaf83 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git 
a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.006.json new file mode 100644 index 000000000..91ea79db2 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr1e-05.json new file mode 100644 index 000000000..88eb8d6c1 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr9e-05.json new file mode 100644 index 000000000..5e2ca3f48 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], 
"epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.0003.json new file mode 100644 index 000000000..856ad541f --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.006.json new file mode 100644 index 000000000..412d169b4 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end 
of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr1e-05.json new file mode 100644 index 000000000..9a349f69a --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr9e-05.json new file mode 100644 index 000000000..d2dd16741 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.4_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.4, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.0003.json new file mode 100644 index 000000000..9a0da0919 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", 
"LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.006.json new file mode 100644 index 000000000..5d25689f1 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr1e-05.json new file mode 100644 index 000000000..fa7d0709a --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 
15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr9e-05.json new file mode 100644 index 000000000..1730d5678 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.0003.json new file mode 100644 index 000000000..8f3ce5e17 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.006.json new file mode 100644 index 000000000..e64aa6fca --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": 
["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr1e-05.json new file mode 100644 index 000000000..e5ec9ee98 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr9e-05.json new file mode 100644 index 000000000..0ad900924 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": 
-5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.0003.json new file mode 100644 index 000000000..14b71c76c --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.006.json new file mode 100644 index 000000000..ea877a20c --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr1e-05.json new file mode 100644 index 000000000..f2022c968 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr1e-05.json @@ -0,0 
+1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr9e-05.json new file mode 100644 index 000000000..e21cc7163 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.7_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.7, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.0003.json new file mode 100644 index 000000000..3376bfb25 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, 
"SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.006.json new file mode 100644 index 000000000..01b6e4572 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr1e-05.json new file mode 100644 index 000000000..51ab282d2 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr9e-05.json new file mode 100644 index 000000000..efb2223cf --- /dev/null +++ 
b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.4_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.4, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.0003.json new file mode 100644 index 000000000..6191396be --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.006.json new file mode 100644 index 000000000..dc9b300c8 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, 
"KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr1e-05.json new file mode 100644 index 000000000..995824813 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr9e-05.json new file mode 100644 index 000000000..db8cfb8c9 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.7_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.7, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.0003.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.0003.json new file mode 100644 index 
000000000..5ea600173 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.0003.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.0003, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.006.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.006.json new file mode 100644 index 000000000..39ee162d6 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr0.006.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 0.006, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr1e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr1e-05.json new file mode 100644 index 000000000..c9e072fcf --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr1e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 1e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, 
"COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr9e-05.json b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr9e-05.json new file mode 100644 index 000000000..d63738662 --- /dev/null +++ b/agent_code/auto_bomber/configs/stable/stable_SOFTMAX_temp0.9_disc0.9_lr9e-05.json @@ -0,0 +1 @@ +{"actions": ["UP", "RIGHT", "DOWN", "LEFT", "WAIT", "BOMB"], "epsilon": 0.25, "discount": 0.9, "learning_rate": 9e-05, "policy": "SOFTMAX", "temperature": 0.9, "region_size": 2, "region_time_tolerance": 6, "game_rewards": {"CRATE_DESTROYED": 70, "COIN_FOUND": 30, "COIN_COLLECTED": 70, "KILLED_OPPONENT": 150, "INVALID_ACTION": -100, "KILLED_SELF": -150, "GOT_KILLED": -50, "SURVIVED_ROUND": 10, "WAITED": -5, "BOMB_DROPPED": 15}} \ No newline at end of file diff --git a/agent_code/auto_bomber/feature_engineering.py b/agent_code/auto_bomber/feature_engineering.py index 12baeaf06..42e2d0c22 100644 --- a/agent_code/auto_bomber/feature_engineering.py +++ b/agent_code/auto_bomber/feature_engineering.py @@ -71,7 +71,7 @@ def state_to_features(game_state: dict) -> np.array: weights=opponents_bomb_action, aggregation_func=lambda v: np.mean(v) if v.size != 0 else 0.0, # normalization_func=lambda v: np.divide(v, np.max(v), out=np.zeros_like(v), where=v != 0)) - normalization_func=lambda v:np.divide(1, v, out=np.zeros_like(v), where=v != 0)) + normalization_func=lambda v: np.divide(1, v, out=np.zeros_like(v), where=v != 0)) # TODO Evaluate if weighting bombs also here by their countdown # TODO Exclude bombs which are not relevant (!!!!) 
diff --git a/settings.py b/settings.py index a98b08d96..53801104d 100644 --- a/settings.py +++ b/settings.py @@ -5,7 +5,7 @@ # Game properties COLS = 17 ROWS = 17 -CRATE_DENSITY = 0.15 # 0.25 # 0.75 +CRATE_DENSITY = 0.15 # 0.75 MAX_AGENTS = 4 # Round properties