From 89059e1db035f802fb1b1d82e04811d50274ed18 Mon Sep 17 00:00:00 2001 From: Adrian Egli Date: Wed, 23 Apr 2025 16:29:33 +0200 Subject: [PATCH 1/3] Update plot.py fix; typo in the resdir (path) --- distributed_q_learning/plot/plot.py | 13 ++----------- 1 file changed, 2 insertions(+), 11 deletions(-) diff --git a/distributed_q_learning/plot/plot.py b/distributed_q_learning/plot/plot.py index 58ba309..9d3f47e 100644 --- a/distributed_q_learning/plot/plot.py +++ b/distributed_q_learning/plot/plot.py @@ -26,20 +26,11 @@ def running_avg(x, ws): if __name__=='__main__': - resdir = '../experiments/reproduce_deterministic' + resdir = '../experiments/reproduce_determinstic/' parq_list = glob.glob(join(resdir, '*/tr_rewards.parquet')) config_list = glob.glob(join(resdir, '*/*_config.csv')) - - config_list = [ - '../experiments/reproduce_deterministic/1/1_config.csv', - '../experiments/reproduce_deterministic/2/2_config.csv', - '../experiments/reproduce_deterministic/3/3_config.csv', - '../experiments/reproduce_deterministic/4/4_config.csv', - '../experiments/reproduce_deterministic/5/5_config.csv', - ] - ws = 5000 plt.figure(figsize=(15,7), dpi=80) @@ -68,4 +59,4 @@ def running_avg(x, ws): plt.xlabel('Episodes') plt.ylabel('Cumulative reward') plt.tight_layout() - plt.savefig('training.png') \ No newline at end of file + plt.savefig('training.png') From d9a7244db70e51cd1c8d2acd6e6fc39564445d59 Mon Sep 17 00:00:00 2001 From: Adrian Egli Date: Wed, 23 Apr 2025 17:55:21 +0200 Subject: [PATCH 2/3] Update train.py Typo --- distributed_q_learning/train.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/distributed_q_learning/train.py b/distributed_q_learning/train.py index 51f2c00..d9da105 100644 --- a/distributed_q_learning/train.py +++ b/distributed_q_learning/train.py @@ -207,7 +207,7 @@ def eval_batch( ], columns=['epsilon', 'epsilon decay', 'alpha', 'alpha decay', 'n_episodes']) # Other parameters -out_dir = 'experiments/reproduce_determinstic' +out_dir = 'experiments/reproduce_deterministic' n_workers = multiprocessing.cpu_count() master_seed = 666 log_every = 10_000 From 8ae50711ce043d5e0dfba678c8c86c5a2c88b233 Mon Sep 17 00:00:00 2001 From: Adrian Egli Date: Wed, 23 Apr 2025 17:56:16 +0200 Subject: [PATCH 3/3] Update plot.py Typo sync --- distributed_q_learning/plot/plot.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/distributed_q_learning/plot/plot.py b/distributed_q_learning/plot/plot.py index 9d3f47e..5f66dcf 100644 --- a/distributed_q_learning/plot/plot.py +++ b/distributed_q_learning/plot/plot.py @@ -26,7 +26,7 @@ def running_avg(x, ws): if __name__=='__main__': - resdir = '../experiments/reproduce_determinstic/' + resdir = '../experiments/reproduce_deterministic/' parq_list = glob.glob(join(resdir, '*/tr_rewards.parquet')) config_list = glob.glob(join(resdir, '*/*_config.csv'))