{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":686160414,"defaultBranch":"main","name":"NeMo-Aligner","ownerLogin":"NVIDIA","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-09-01T22:46:28.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/1728152?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1720131851.0","currentOid":""},"activityList":{"items":[{"before":"6ad02bd0b75f8ef93b28b0f89238d4cafaa42f3a","after":"82b5ae8f4415a265ce9e84229f349f0733f88741","ref":"refs/heads/yi/trtllm_support","pushedAt":"2024-07-04T22:30:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"yidong72","name":"Yi Dong","path":"/yidong72","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/43824965?s=80&v=4"},"commit":{"message":"remove threading\n\nSigned-off-by: Yi Dong ","shortMessageHtmlLink":"remove threading"}},{"before":null,"after":"81bb931f3418b250b01984fe6b5861dc8101454a","ref":"refs/heads/yi/trtllm_tree","pushedAt":"2024-07-04T22:24:11.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"yidong72","name":"Yi Dong","path":"/yidong72","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/43824965?s=80&v=4"},"commit":{"message":"init\n\nSigned-off-by: Yi Dong ","shortMessageHtmlLink":"init"}},{"before":"2705861f7626f52271130042f237a6ae141cc2d2","after":"7d3f43c6eb95bcc1c52151d8b786c7a89a0f2f17","ref":"refs/heads/cai","pushedAt":"2024-07-04T08:07:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"snisimov","name":null,"path":"/snisimov","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150595186?s=80&v=4"},"commit":{"message":"minor (documentation update)\n\n\nSigned-off-by: shami nisimov ","shortMessageHtmlLink":"minor (documentation update)"}},{"before":"1d651fbad5aff9907afd522188ef7b451a076c75","after":"2705861f7626f52271130042f237a6ae141cc2d2","ref":"refs/heads/cai","pushedAt":"2024-07-04T07:17:30.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"snisimov","name":null,"path":"/snisimov","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150595186?s=80&v=4"},"commit":{"message":"Merge branch 'main' into cai","shortMessageHtmlLink":"Merge branch 'main' into cai"}},{"before":"b0f6d559e40131396aafb71b57823444bf4523b8","after":"1d651fbad5aff9907afd522188ef7b451a076c75","ref":"refs/heads/cai","pushedAt":"2024-07-04T07:11:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"snisimov","name":null,"path":"/snisimov","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150595186?s=80&v=4"},"commit":{"message":"minor comment change\n\nSigned-off-by: snisimov ","shortMessageHtmlLink":"minor comment change"}},{"before":"2775e816424dbbb5b6c02f3c3838b962babb9475","after":"d85b62c0b62732e9df88abfdceb15107ecc04cf9","ref":"refs/heads/geshen/critic_speedup","pushedAt":"2024-07-03T23:42:44.000Z","pushType":"push","commitsCount":7,"pusher":{"login":"gshennvm","name":"Gerald Shen","path":"/gshennvm","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119401249?s=80&v=4"},"commit":{"message":"fix signature of tokenize batch\n\nSigned-off-by: Gerald Shen ","shortMessageHtmlLink":"fix signature of tokenize batch"}},{"before":"dec062187d978466c292a6cb28abba3491bda095","after":"f889f8951fcb290df1cc2c489839e660ee40d721","ref":"refs/heads/degert/spin-save-generations","pushedAt":"2024-07-03T23:37:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"trias702","name":null,"path":"/trias702","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/25867060?s=80&v=4"},"commit":{"message":"Padded generations to same shape\n\nSigned-off-by: Daniel Egert ","shortMessageHtmlLink":"Padded generations to same shape"}},{"before":"afc5d1bf71186aae719505aca0ef7ae6913b96a2","after":null,"ref":"refs/heads/terryk/str-generate","pushedAt":"2024-07-03T23:35:38.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"}},{"before":"2421c7354232bb08f89100ed2c297eae938d5ee9","after":"e946f5d4fd27a3ea5d644542b0a1e77cd105da68","ref":"refs/heads/main","pushedAt":"2024-07-03T23:35:28.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"},"commit":{"message":"Add feat to allow GPTSFTModel.generate from str inputs (#229)\n\n* Add feat to allow GPTSFTModel.generate from str inputs\r\n\r\nThe type support for inputs now matches MegatronGPTModel\r\nwhich was important to use megatron_gpt_eval.py\r\n\r\nSigned-off-by: Terry Kong \r\n\r\n* [pre-commit.ci] auto fixes from pre-commit.com hooks\r\n\r\nfor more information, see https://pre-commit.ci\r\n\r\n---------\r\n\r\nSigned-off-by: Terry Kong \r\nCo-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>","shortMessageHtmlLink":"Add feat to allow GPTSFTModel.generate from str inputs (#229)"}},{"before":"af0dbf38417f5c3b451efc47ab109d76e96dc9da","after":"afc5d1bf71186aae719505aca0ef7ae6913b96a2","ref":"refs/heads/terryk/str-generate","pushedAt":"2024-07-03T22:29:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"pre-commit-ci[bot]","name":null,"path":"/apps/pre-commit-ci","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/68672?s=80&v=4"},"commit":{"message":"[pre-commit.ci] auto fixes from pre-commit.com hooks\n\nfor more information, see https://pre-commit.ci","shortMessageHtmlLink":"[pre-commit.ci] auto fixes from pre-commit.com hooks"}},{"before":"8d8ef38bc7b190d9a3d0b5face76147b9e0ae863","after":"af0dbf38417f5c3b451efc47ab109d76e96dc9da","ref":"refs/heads/terryk/str-generate","pushedAt":"2024-07-03T22:28:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"},"commit":{"message":"Add feat to allow GPTSFTModel.generate from str inputs\n\nThe type support for inputs now matches MegatronGPTModel\nwhich was important to use megatron_gpt_eval.py\n\nSigned-off-by: Terry Kong ","shortMessageHtmlLink":"Add feat to allow GPTSFTModel.generate from str inputs"}},{"before":"c713cecb4b56c3c5dee2a681734102f6f00422f1","after":"78ef52911bf3a9e55f4c258d96c7f4b2652766fa","ref":"refs/heads/ssy/fix-ref-policy","pushedAt":"2024-07-03T22:24:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"pre-commit-ci[bot]","name":null,"path":"/apps/pre-commit-ci","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/68672?s=80&v=4"},"commit":{"message":"[pre-commit.ci] auto fixes from pre-commit.com hooks\n\nfor more information, see https://pre-commit.ci","shortMessageHtmlLink":"[pre-commit.ci] auto fixes from pre-commit.com hooks"}},{"before":null,"after":"c713cecb4b56c3c5dee2a681734102f6f00422f1","ref":"refs/heads/ssy/fix-ref-policy","pushedAt":"2024-07-03T22:17:02.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"shengyangs","name":"Shengyang Sun","path":"/shengyangs","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150360624?s=80&v=4"},"commit":{"message":"fix log probs mismatch\n\nSigned-off-by: Shengyang Sun ","shortMessageHtmlLink":"fix log probs mismatch"}},{"before":null,"after":"dec062187d978466c292a6cb28abba3491bda095","ref":"refs/heads/degert/spin-save-generations","pushedAt":"2024-07-03T21:25:19.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"trias702","name":null,"path":"/trias702","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/25867060?s=80&v=4"},"commit":{"message":"Initial commit\n\nSigned-off-by: Daniel Egert ","shortMessageHtmlLink":"Initial commit"}},{"before":"8d8ef38bc7b190d9a3d0b5face76147b9e0ae863","after":"2421c7354232bb08f89100ed2c297eae938d5ee9","ref":"refs/heads/main","pushedAt":"2024-07-03T19:57:13.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"shengyangs","name":"Shengyang Sun","path":"/shengyangs","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150360624?s=80&v=4"},"commit":{"message":"Implement the reward aware preference optimization algorithms. (#195)\n\n* Implement the reward_aware_po algorithms.\r\n\r\ninit\r\n\r\nenable gt_reward scale\r\n\r\nenable kl_penalty restoring by state_dict\r\n\r\nfix typo\r\n\r\nswap reward_dpo & reward_rev_dpo\r\n\r\nfix reward type bug\r\n\r\nrmv loss average\r\n\r\nremove ref_policy_kl_penalty out of state dict\r\n\r\nupdate default chosen_reward in rpo\r\n\r\nrmv ref_policy_kl_penalty from wandb metrics\r\n\r\nupdate conf\r\n\r\nupdate dpo_loss_weight and sft_loss_weight\r\n\r\nSigned-off-by: Shengyang Sun \r\n\r\npolish RPO code; add comments\r\n\r\nSigned-off-by: Shengyang Sun \r\n\r\n[pre-commit.ci] auto fixes from pre-commit.com hooks\r\n\r\nfor more information, see https://pre-commit.ci\r\n\r\n[pre-commit.ci] auto fixes from pre-commit.com hooks\r\n\r\nfor more information, see https://pre-commit.ci\r\n\r\nfix loss computation\r\n\r\nSigned-off-by: Gerald Shen \r\n\r\naverage log prob for SFT should be set to True\r\n\r\nSigned-off-by: Gerald Shen \r\n\r\nRevert \"average log prob for SFT should be set to True\"\r\n\r\nThis reverts commit 8feb093655d753bdf63a487bbe59f84d8a1079d2.\r\n\r\nrename rpo; separate avg_logprobs; update rst\r\n\r\nSigned-off-by: Shengyang Sun \r\n\r\nmove nograd_length to constructor\r\n\r\nSigned-off-by: Shengyang Sun \r\n\r\n* [pre-commit.ci] auto fixes from pre-commit.com hooks\r\n\r\nfor more information, see https://pre-commit.ci\r\n\r\n* fix rpo default reward config\r\n\r\nSigned-off-by: Shengyang Sun \r\n\r\n---------\r\n\r\nSigned-off-by: Shengyang Sun \r\nCo-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>\r\nCo-authored-by: Gerald Shen ","shortMessageHtmlLink":"Implement the reward aware preference optimization algorithms. (#195)"}},{"before":null,"after":"8d8ef38bc7b190d9a3d0b5face76147b9e0ae863","ref":"refs/heads/terryk/str-generate","pushedAt":"2024-07-03T18:27:18.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"},"commit":{"message":"fix broken tutorial link (#223)\n\nSigned-off-by: Gerald Shen ","shortMessageHtmlLink":"fix broken tutorial link (#223)"}},{"before":"f60ea0a6b05892da23f852c4f1dd6864cd00eeb5","after":"b0f6d559e40131396aafb71b57823444bf4523b8","ref":"refs/heads/cai","pushedAt":"2024-07-03T17:36:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"gleibovich-nvidia","name":null,"path":"/gleibovich-nvidia","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150582838?s=80&v=4"},"commit":{"message":"CAI.rst -> cai.rst also on index.rst\n\nSigned-off-by: Gal Leibovich ","shortMessageHtmlLink":"CAI.rst -> cai.rst also on index.rst"}},{"before":"6dd0a87b6321924e97bdc6868a82bdc2c1ebb1f2","after":"f60ea0a6b05892da23f852c4f1dd6864cd00eeb5","ref":"refs/heads/cai","pushedAt":"2024-07-03T17:07:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"gleibovich-nvidia","name":null,"path":"/gleibovich-nvidia","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150582838?s=80&v=4"},"commit":{"message":"CAI.rst -> cai.rst\n\nSigned-off-by: Gal Leibovich ","shortMessageHtmlLink":"CAI.rst -> cai.rst"}},{"before":"fdfb16178cb856321919a0b885181a62848d6534","after":"f926a39da2e992726c510cef40d8316dd3fb1b19","ref":"refs/heads/ssy/reward-aware-po","pushedAt":"2024-07-03T15:42:57.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"shengyangs","name":"Shengyang Sun","path":"/shengyangs","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150360624?s=80&v=4"},"commit":{"message":"fix rpo default reward config\n\nSigned-off-by: Shengyang Sun ","shortMessageHtmlLink":"fix rpo default reward config"}},{"before":"fc769a69d9762efa32ca893174a62bdb2e3f8728","after":"6dd0a87b6321924e97bdc6868a82bdc2c1ebb1f2","ref":"refs/heads/cai","pushedAt":"2024-07-03T12:10:21.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"gleibovich-nvidia","name":null,"path":"/gleibovich-nvidia","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150582838?s=80&v=4"},"commit":{"message":"Merge branch 'main' into cai\n\nSigned-off-by: Gal Leibovich ","shortMessageHtmlLink":"Merge branch 'main' into cai"}},{"before":"a13651dd65bf31ef169fa305eb8acbaf010f4b47","after":"fc769a69d9762efa32ca893174a62bdb2e3f8728","ref":"refs/heads/cai","pushedAt":"2024-07-03T11:28:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"gleibovich-nvidia","name":null,"path":"/gleibovich-nvidia","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150582838?s=80&v=4"},"commit":{"message":"rst bug fix\n\nSigned-off-by: Gal Leibovich ","shortMessageHtmlLink":"rst bug fix"}},{"before":"621d3f0bd0f08257d95abed911eadf93f2ad4fcf","after":"a13651dd65bf31ef169fa305eb8acbaf010f4b47","ref":"refs/heads/cai","pushedAt":"2024-07-03T11:02:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"snisimov","name":null,"path":"/snisimov","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150595186?s=80&v=4"},"commit":{"message":"minor\n\nSigned-off-by: shami nisimov ","shortMessageHtmlLink":"minor"}},{"before":"0c91e21f317423aba8344441933bb1779ca66d77","after":"621d3f0bd0f08257d95abed911eadf93f2ad4fcf","ref":"refs/heads/cai","pushedAt":"2024-07-03T10:54:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"pre-commit-ci[bot]","name":null,"path":"/apps/pre-commit-ci","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/68672?s=80&v=4"},"commit":{"message":"[pre-commit.ci] auto fixes from pre-commit.com hooks\n\nfor more information, see https://pre-commit.ci","shortMessageHtmlLink":"[pre-commit.ci] auto fixes from pre-commit.com hooks"}},{"before":"b2e1f6e1bf75178babd926acce189b91f156c084","after":"0c91e21f317423aba8344441933bb1779ca66d77","ref":"refs/heads/cai","pushedAt":"2024-07-03T10:53:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"snisimov","name":null,"path":"/snisimov","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/150595186?s=80&v=4"},"commit":{"message":"integrated changes from PR #9354 in NeMo (Chat template support for megatron_gpt_eval.py).\n\nSigned-off-by: shami nisimov ","shortMessageHtmlLink":"integrated changes from PR #9354 in NeMo (Chat template support for m…"}},{"before":null,"after":"a58f2ff97ea0d072069a344ddce1ab1df174fc18","ref":"refs/heads/terryk/export-rollouts-jsonl","pushedAt":"2024-07-03T06:20:59.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"},"commit":{"message":"Adds flag to dump rollouts to jsonl file","shortMessageHtmlLink":"Adds flag to dump rollouts to jsonl file"}},{"before":"ce7a07fdc6238150af8310e039005cebb91d9f9e","after":null,"ref":"refs/heads/terryk/export-rollouts-jsonl","pushedAt":"2024-07-03T06:17:30.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"}},{"before":null,"after":"ce7a07fdc6238150af8310e039005cebb91d9f9e","ref":"refs/heads/terryk/export-rollouts-jsonl","pushedAt":"2024-07-03T06:01:03.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"terrykong","name":"Terry Kong","path":"/terrykong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7576060?s=80&v=4"},"commit":{"message":"cleanup communicator clean\n\nSigned-off-by: Gerald Shen ","shortMessageHtmlLink":"cleanup communicator clean"}},{"before":"ec548b8ed9a0ad781a4a025980d61e4291996371","after":"ce7a07fdc6238150af8310e039005cebb91d9f9e","ref":"refs/heads/geshen/trt_llm_to_main","pushedAt":"2024-07-03T00:25:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"gshennvm","name":"Gerald Shen","path":"/gshennvm","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119401249?s=80&v=4"},"commit":{"message":"cleanup communicator clean\n\nSigned-off-by: Gerald Shen ","shortMessageHtmlLink":"cleanup communicator clean"}},{"before":"4d0853dd876c8b07203f973c30ffca6fc41a6aef","after":"ec548b8ed9a0ad781a4a025980d61e4291996371","ref":"refs/heads/geshen/trt_llm_to_main","pushedAt":"2024-07-03T00:20:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"gshennvm","name":"Gerald Shen","path":"/gshennvm","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/119401249?s=80&v=4"},"commit":{"message":"add nemo guard for when things don't stop properly\n\nSigned-off-by: Gerald Shen ","shortMessageHtmlLink":"add nemo guard for when things don't stop properly"}},{"before":"2d0c7560c7fcc2959effabee696368ba4dde080b","after":"550e7d43eaae2a05dfa335762346a12e3a6a4067","ref":"refs/heads/pre-commit-ci-update-config","pushedAt":"2024-07-02T00:18:20.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"pre-commit-ci[bot]","name":null,"path":"/apps/pre-commit-ci","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/68672?s=80&v=4"},"commit":{"message":"[pre-commit.ci] pre-commit suggestions\n\nupdates:\n- [github.com/pre-commit/pre-commit-hooks: v4.3.0 → v4.6.0](https://github.com/pre-commit/pre-commit-hooks/compare/v4.3.0...v4.6.0)\n- [github.com/PyCQA/isort: 5.12.0 → 5.13.2](https://github.com/PyCQA/isort/compare/5.12.0...5.13.2)\n- [github.com/psf/black: 19.10b0 → 24.4.2](https://github.com/psf/black/compare/19.10b0...24.4.2)","shortMessageHtmlLink":"[pre-commit.ci] pre-commit suggestions"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEd0ocvgA","startCursor":null,"endCursor":null}},"title":"Activity · NVIDIA/NeMo-Aligner"}