{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":591659031,"defaultBranch":"main","name":"Muesli-lunarlander","ownerLogin":"Itomigna2","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-01-21T12:55:32.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/119741210?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1709182603.0","currentOid":""},"activityList":{"items":[{"before":"d22cbdb90b73ae87312af0fb34ddebc378a7ddb4","after":"a09d8af69a5d7c38884b51b99637217d4001facc","ref":"refs/heads/main","pushedAt":"2024-03-18T01:38:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Docs: change readme about gpu option","shortMessageHtmlLink":"Docs: change readme about gpu option"}},{"before":"53275f5dbffa04dd2bcbcff99a05278503ee4134","after":"d22cbdb90b73ae87312af0fb34ddebc378a7ddb4","ref":"refs/heads/main","pushedAt":"2024-03-15T09:02:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"441209e7e666c328ff85f80efb37ae27417d047e","after":"53275f5dbffa04dd2bcbcff99a05278503ee4134","ref":"refs/heads/main","pushedAt":"2024-03-15T09:01:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Feat: HPO with Tensorboard\n\n- For the bug of using ms nni based HPO, (mismatched hyperparameter), so I use TensorBoard for HPO\n- some change to order of the params (just order changed)\n- manual will be described in README.","shortMessageHtmlLink":"Feat: HPO with Tensorboard"}},{"before":"aada386372ac81907b4a2da191920f1179fccf39","after":"441209e7e666c328ff85f80efb37ae27417d047e","ref":"refs/heads/main","pushedAt":"2024-03-11T01:19:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Fix: remove dtype conversion\n\n- .float to input makes code slow a lot, it is removed\n- it fix the bugs related to process conflict and GPU resource conflict too.\ncloses #6","shortMessageHtmlLink":"Fix: remove dtype conversion"}},{"before":"a80ade484c3c1108d0c4f3db00baece56a7a125b","after":"aada386372ac81907b4a2da191920f1179fccf39","ref":"refs/heads/main","pushedAt":"2024-03-05T07:00:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"5824d0bf4e76b623c9ad92e3d18aa25786893265","after":"a80ade484c3c1108d0c4f3db00baece56a7a125b","ref":"refs/heads/main","pushedAt":"2024-03-04T05:33:31.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Build: fix the jupyterlab-collaboration's version to 2.0.1","shortMessageHtmlLink":"Build: fix the jupyterlab-collaboration's version to 2.0.1"}},{"before":"c9f2442d213538a78ed74ee9cf7cf95616046da0","after":"5824d0bf4e76b623c9ad92e3d18aa25786893265","ref":"refs/heads/main","pushedAt":"2024-02-29T05:18:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"8deb159b79686582859cfe3d12d362026122b32f","after":null,"ref":"refs/heads/minigrid","pushedAt":"2024-02-29T04:56:43.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":null,"after":"8deb159b79686582859cfe3d12d362026122b32f","ref":"refs/heads/minigrid(deprecated)","pushedAt":"2024-02-29T04:56:42.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Refactor: parameterize neg rew val","shortMessageHtmlLink":"Refactor: parameterize neg rew val"}},{"before":"feaa4b2ea65faafc1547c57b89167dc5e81e5d30","after":null,"ref":"refs/heads/hparam","pushedAt":"2024-02-29T04:56:25.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":null,"after":"feaa4b2ea65faafc1547c57b89167dc5e81e5d30","ref":"refs/heads/hparam(deprecated)","pushedAt":"2024-02-29T04:56:23.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Refactor: hyperparameterize\n\n- hs resolution\n- loss weight\n- norm adv\n- discount","shortMessageHtmlLink":"Refactor: hyperparameterize"}},{"before":"71b45a68541c1122e0ad3360b23b720cb184ea2f","after":null,"ref":"refs/heads/lunar_rgb","pushedAt":"2024-02-29T04:56:15.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":null,"after":"71b45a68541c1122e0ad3360b23b720cb184ea2f","ref":"refs/heads/lunar_rgb(deprecated)","pushedAt":"2024-02-29T04:56:14.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Feat: random seed on/off by param","shortMessageHtmlLink":"Feat: random seed on/off by param"}},{"before":"ccc3486963d341e2b651b3488cfb34062ce1bdd1","after":"c9f2442d213538a78ed74ee9cf7cf95616046da0","ref":"refs/heads/main","pushedAt":"2024-02-29T04:55:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Merge: manually merged from lunar_rgb branch\n\n- Sorry for manual update due to twisted branching\n- It is relaying from lunar_rgb(deprecated)\n- more explanation will be commented on this commit","shortMessageHtmlLink":"Merge: manually merged from lunar_rgb branch"}},{"before":"6582b81570a85ece7b02dd7cd4f28c93a88ee1d0","after":"71b45a68541c1122e0ad3360b23b720cb184ea2f","ref":"refs/heads/lunar_rgb","pushedAt":"2024-02-29T02:21:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Feat: random seed on/off by param","shortMessageHtmlLink":"Feat: random seed on/off by param"}},{"before":"70693a400fc2d677117dec3d2aec8a02b1bc9294","after":"6582b81570a85ece7b02dd7cd4f28c93a88ee1d0","ref":"refs/heads/lunar_rgb","pushedAt":"2024-02-29T00:49:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Feat: Using deep IMPALA CNN\n\n- Change the shallow CNN to deep CNN described in IMPALA paper and it works!\n- change experiment length 4000->20000, RGB env needs more data and training than vector based env.\n-This version is working in the env with non-fixed random seed!\n- Training takes more than 15 hours, longer experiment length 5000>","shortMessageHtmlLink":"Feat: Using deep IMPALA CNN"}},{"before":"ccc3486963d341e2b651b3488cfb34062ce1bdd1","after":null,"ref":"refs/heads/lunar_vec","pushedAt":"2024-02-28T04:38:39.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":null,"after":"ccc3486963d341e2b651b3488cfb34062ce1bdd1","ref":"refs/heads/lunar_vec(deprecated)","pushedAt":"2024-02-28T04:38:37.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":null,"after":"ccc3486963d341e2b651b3488cfb34062ce1bdd1","ref":"refs/heads/lunar_vec","pushedAt":"2024-02-28T04:38:20.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"9c230c5d3113fbd91850ffa0f3c6a12e21729afa","after":"70693a400fc2d677117dec3d2aec8a02b1bc9294","ref":"refs/heads/lunar_rgb","pushedAt":"2024-02-28T04:37:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"b23e2e6f80ea71a4a3c7e4a6bfa974de3c7251d2","after":"9c230c5d3113fbd91850ffa0f3c6a12e21729afa","ref":"refs/heads/lunar_rgb","pushedAt":"2024-02-28T02:21:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Refactor: major changes on the network\n\n- I see light at the end of the tunnel, hope this network architecture is right.\n- Network is changed to CNN+LSTM based structure\n- Loss calculations are changed to matching the network’s in/output shapes.\n- Bug fix on categorical representation (related to softmax), with changing v,r model loss term as written in MuZero supplementary matarial.\n- Change KLdiv reduction method in the L_m loss calculation\n- Find hyperparameters\n- Draw more informations (value prediction, embbeding, adv norm related vars on TensorBoard\n- Mixed prior without P_traj(behavior policy)\n\n##Problems still remained\n- It can converse only when using environment with fixed random seed.\n- Still have some unstable convergence with small architecture change, hyperparameter change, random seed change.\n- CNN encoder is still weak. Better encoder need to be experimented.\n- Still without off-policy correction(V-trace, Retrace)","shortMessageHtmlLink":"Refactor: major changes on the network"}},{"before":"7f68252e73c71cea1f21bd4da0052d717d117dc7","after":null,"ref":"refs/heads/test_vecenv","pushedAt":"2024-02-01T00:10:06.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":"51a809b96067e11467b1a96d97fd2ff02fb19041","after":null,"ref":"refs/heads/atari","pushedAt":"2024-02-01T00:09:59.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"}},{"before":null,"after":"7f68252e73c71cea1f21bd4da0052d717d117dc7","ref":"refs/heads/test_vecenv","pushedAt":"2024-01-30T01:46:24.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"temp","shortMessageHtmlLink":"temp"}},{"before":"90e6e7facb9ec13627efd300b73a24879ae7ea66","after":"b23e2e6f80ea71a4a3c7e4a6bfa974de3c7251d2","ref":"refs/heads/lunar_rgb","pushedAt":"2024-01-26T05:06:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"b7afc8b8e5b9c757c1a8a824c7760fd8d641a2c5","after":"90e6e7facb9ec13627efd300b73a24879ae7ea66","ref":"refs/heads/lunar_rgb","pushedAt":"2024-01-26T01:51:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Rename: move deprecated files","shortMessageHtmlLink":"Rename: move deprecated files"}},{"before":"1a2a8b399ab66254599eb137c256763a8a613ea9","after":"ccc3486963d341e2b651b3488cfb34062ce1bdd1","ref":"refs/heads/main","pushedAt":"2024-01-26T01:46:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"72bfafe62ee587784365b8da401691f8ca4c42c3","after":"b7afc8b8e5b9c757c1a8a824c7760fd8d641a2c5","ref":"refs/heads/lunar_rgb","pushedAt":"2024-01-26T01:21:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"961a1c8ead4519060ad8d913aac6d0712709872a","after":"72bfafe62ee587784365b8da401691f8ca4c42c3","ref":"refs/heads/lunar_rgb","pushedAt":"2024-01-25T08:50:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Test\n\n- it still not work well.","shortMessageHtmlLink":"Test"}},{"before":"b62076f50523a9d04b452d9191db39b077b78eb4","after":"961a1c8ead4519060ad8d913aac6d0712709872a","ref":"refs/heads/lunar_rgb","pushedAt":"2024-01-24T08:58:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Itomigna2","name":null,"path":"/Itomigna2","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119741210?s=80&v=4"},"commit":{"message":"Refactor: can select about stacking action plane","shortMessageHtmlLink":"Refactor: can select about stacking action plane"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"startCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wMy0xOFQwMTozODowNi4wMDAwMDBazwAAAAQYEj1V","endCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wMS0yNFQwODo1ODoxNC4wMDAwMDBazwAAAAPntJT1"}},"title":"Activity · Itomigna2/Muesli-lunarlander"}