{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":679218428,"defaultBranch":"main","name":"RWKV-infctx-trainer","ownerLogin":"RWKV","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-08-16T11:01:34.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/132652788?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1715870053.0","currentOid":""},"activityList":{"items":[{"before":"b2e191907c43a640c24d6078dffacdb64337618e","after":"eb9ae540e05c64633732149dd98c3d52df76dd7a","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-05-16T14:41:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update model.py","shortMessageHtmlLink":"Update model.py"}},{"before":"d45e3ce72384ad947e4d6b31c95d8adaa92c969d","after":"b2e191907c43a640c24d6078dffacdb64337618e","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-05-16T14:38:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update model.py","shortMessageHtmlLink":"Update model.py"}},{"before":"ef2f4582e89cb131a0e457976ece8d67465c9970","after":"d45e3ce72384ad947e4d6b31c95d8adaa92c969d","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-05-16T14:35:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update model.py","shortMessageHtmlLink":"Update model.py"}},{"before":"67036ed569599542a39487ebb42b5cec1d83e1e7","after":null,"ref":"refs/heads/m8than-variable-doc-length","pushedAt":"2024-05-16T14:34:13.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"}},{"before":null,"after":"67036ed569599542a39487ebb42b5cec1d83e1e7","ref":"refs/heads/m8than-variable-doc-length","pushedAt":"2024-05-16T14:31:04.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update model.py\n\nFix variable length document training","shortMessageHtmlLink":"Update model.py"}},{"before":"b913716d21bb3a3f44d2834a721859f1aff8f6aa","after":"5e3d7489c632908b4a2ff80e317d822838124618","ref":"refs/heads/rwkv-x5-stateTune","pushedAt":"2024-05-13T21:25:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"WIP state tune implement","shortMessageHtmlLink":"WIP state tune implement"}},{"before":"a3e393fe3e1b482e0a3cb16062ac016390d8a2ab","after":"b913716d21bb3a3f44d2834a721859f1aff8f6aa","ref":"refs/heads/rwkv-x5-stateTune","pushedAt":"2024-05-04T09:30:35.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"state tune POC","shortMessageHtmlLink":"state tune POC"}},{"before":"46c127798e3ac1815b6ba502b439575978ac5247","after":"a3e393fe3e1b482e0a3cb16062ac016390d8a2ab","ref":"refs/heads/rwkv-x5-stateTune","pushedAt":"2024-05-04T09:23:33.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"prototype state tuning support with wkv_state","shortMessageHtmlLink":"prototype state tuning support with wkv_state"}},{"before":"93bba238d4bb63d1151cb8fa6ef0d30b34a151ba","after":"46c127798e3ac1815b6ba502b439575978ac5247","ref":"refs/heads/rwkv-x5-stateTune","pushedAt":"2024-05-03T12:47:36.000Z","pushType":"pr_merge","commitsCount":26,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Merge pull request #99 from RWKV/rwkv-x5-segmentedLoss\n\nRwkv x5 segmented loss","shortMessageHtmlLink":"Merge pull request #99 from RWKV/rwkv-x5-segmentedLoss"}},{"before":"71b395d84880a6556aaf0fba09e2dcb4c3f8dff5","after":"0f1b50b6f43b1a365b4dbacecdbada59407a6917","ref":"refs/heads/rwkv-x5-segmentedLoss","pushedAt":"2024-05-03T12:36:04.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Merge pull request #95 from neurallambda/fix-tokenizer\n\nFix trie-tokenizer decoding","shortMessageHtmlLink":"Merge pull request #95 from neurallambda/fix-tokenizer"}},{"before":"1d0d964631bda7d19e172236771a0487e1fe1bb8","after":"71b395d84880a6556aaf0fba09e2dcb4c3f8dff5","ref":"refs/heads/rwkv-x5-segmentedLoss","pushedAt":"2024-05-03T12:34:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Added full_segmented_loss flag","shortMessageHtmlLink":"Added full_segmented_loss flag"}},{"before":"70d02c4997578a027d110e3acb03a523d3986448","after":"1d0d964631bda7d19e172236771a0487e1fe1bb8","ref":"refs/heads/rwkv-x5-segmentedLoss","pushedAt":"2024-05-03T08:51:03.000Z","pushType":"pr_merge","commitsCount":6,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Merge pull request #97 from RWKV/m8than-fix-variable-length\n\nFixed 0 loss issue + changed segment loss algorithm to base learning rate on ctx length rather than document length.","shortMessageHtmlLink":"Merge pull request #97 from RWKV/m8than-fix-variable-length"}},{"before":null,"after":"70d02c4997578a027d110e3acb03a523d3986448","ref":"refs/heads/rwkv-x5-segmentedLoss","pushedAt":"2024-05-03T08:50:15.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Merge pull request #96 from RWKV/m8than-fix-variable-length\n\nVariable length dataset fix, (0 length input fix)","shortMessageHtmlLink":"Merge pull request #96 from RWKV/m8than-fix-variable-length"}},{"before":null,"after":"93bba238d4bb63d1151cb8fa6ef0d30b34a151ba","ref":"refs/heads/rwkv-x5-stateTune","pushedAt":"2024-05-03T08:37:24.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"enwiki v5 test","shortMessageHtmlLink":"enwiki v5 test"}},{"before":"048f05de79ade1bfba15c2f380d236526d7a2fef","after":"e2704ac45b26fcd763bd10ad6f1f1c472b6d7c5d","ref":"refs/heads/rwkv-x6-layerNbits","pushedAt":"2024-05-03T05:59:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"MQT L24","shortMessageHtmlLink":"MQT L24"}},{"before":"427895dfd48228eac8d8e2f5111afde6b0b88b2d","after":"1347e5c5aa6bb74952c70bf47132c98dc152779f","ref":"refs/heads/rwkv-6-support","pushedAt":"2024-05-01T17:03:10.000Z","pushType":"push","commitsCount":7,"pusher":{"login":"SmerkyG","name":null,"path":"/SmerkyG","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8826350?s=80&v=4"},"commit":{"message":"metrics update, model updates to match v5","shortMessageHtmlLink":"metrics update, model updates to match v5"}},{"before":"24efc87f148ec2434d314284cdb8c6d53d112a1c","after":"427895dfd48228eac8d8e2f5111afde6b0b88b2d","ref":"refs/heads/rwkv-6-support","pushedAt":"2024-05-01T17:02:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"SmerkyG","name":null,"path":"/SmerkyG","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8826350?s=80&v=4"},"commit":{"message":"metrics patch, model updates to match v5","shortMessageHtmlLink":"metrics patch, model updates to match v5"}},{"before":null,"after":"19549b920367db830964cefd5745a9f7c76119b3","ref":"refs/heads/rwkv-x6-layerNbits-b1","pushedAt":"2024-05-01T10:56:01.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"somehow things broke?","shortMessageHtmlLink":"somehow things broke?"}},{"before":"e4084a0408d298a384be5c9b745ced10407af8b6","after":"048f05de79ade1bfba15c2f380d236526d7a2fef","ref":"refs/heads/rwkv-x6-layerNbits","pushedAt":"2024-05-01T10:13:57.000Z","pushType":"push","commitsCount":5,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"WIP L24 test","shortMessageHtmlLink":"WIP L24 test"}},{"before":"724271d9062218ad0332e975d3b5fd9fcec94410","after":"ef2f4582e89cb131a0e457976ece8d67465c9970","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-26T22:25:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"full segmented loss","shortMessageHtmlLink":"full segmented loss"}},{"before":"ca2cc11d34069216b39627a0c04adfa762885217","after":"724271d9062218ad0332e975d3b5fd9fcec94410","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-26T22:22:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update config-example.yaml","shortMessageHtmlLink":"Update config-example.yaml"}},{"before":"be27fdbe63299417f53abc265974f7726d4e3c3d","after":"ca2cc11d34069216b39627a0c04adfa762885217","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-26T18:55:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"loss/lr based on segment size/ctx length now instead","shortMessageHtmlLink":"loss/lr based on segment size/ctx length now instead"}},{"before":"ddc8c4c9472f8f29998c7a84e6184469a6784ba7","after":"be27fdbe63299417f53abc265974f7726d4e3c3d","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-26T15:40:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"fix 0 train loss hang","shortMessageHtmlLink":"fix 0 train loss hang"}},{"before":"b38cb52dab819063a69352985f7e3102d9d86b9b","after":"ddc8c4c9472f8f29998c7a84e6184469a6784ba7","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-25T23:25:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"fix large variations in data sequence length","shortMessageHtmlLink":"fix large variations in data sequence length"}},{"before":"a5a2b2c673cecf419adc3535bf1aec7696b0ccf6","after":"e4084a0408d298a384be5c9b745ced10407af8b6","ref":"refs/heads/rwkv-x6-layerNbits","pushedAt":"2024-04-25T19:49:53.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"porting nathans mixed dataset size fix","shortMessageHtmlLink":"porting nathans mixed dataset size fix"}},{"before":"a80a0f767e41675b19fd46896d63b1ee4fbee2de","after":"70d02c4997578a027d110e3acb03a523d3986448","ref":"refs/heads/main","pushedAt":"2024-04-25T19:47:42.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"PicoCreator","name":"Eugene Cheah","path":"/PicoCreator","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17175484?s=80&v=4"},"commit":{"message":"Merge pull request #96 from RWKV/m8than-fix-variable-length\n\nVariable length dataset fix, (0 length input fix)","shortMessageHtmlLink":"Merge pull request #96 from RWKV/m8than-fix-variable-length"}},{"before":"e1ce8eb85c7b1b73a4798e7b4aada517cd215364","after":"268879d6d7c28b1e0e95f6ea1d79abccbf1ccade","ref":"refs/heads/rwkv-experimental","pushedAt":"2024-04-25T19:46:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"SmerkyG","name":null,"path":"/SmerkyG","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8826350?s=80&v=4"},"commit":{"message":"bugfix for cos lr\n\n(cherry picked from commit 4bf0aa29be646a30ab997e790fb1fd6e090bd458)","shortMessageHtmlLink":"bugfix for cos lr"}},{"before":"3eb0d2f60f216b182896c8476c8b40e2f6b83359","after":"4bf0aa29be646a30ab997e790fb1fd6e090bd458","ref":"refs/heads/rwkv-experimental-hash","pushedAt":"2024-04-25T19:46:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"SmerkyG","name":null,"path":"/SmerkyG","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8826350?s=80&v=4"},"commit":{"message":"bugfix for cos lr","shortMessageHtmlLink":"bugfix for cos lr"}},{"before":"ae2e89073697f17ee2d761ca129decc6e7dc296f","after":"b38cb52dab819063a69352985f7e3102d9d86b9b","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-25T19:13:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Update model.py","shortMessageHtmlLink":"Update model.py"}},{"before":null,"after":"ae2e89073697f17ee2d761ca129decc6e7dc296f","ref":"refs/heads/m8than-fix-variable-length","pushedAt":"2024-04-25T18:28:38.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"m8than","name":"Nathan","path":"/m8than","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23742732?s=80&v=4"},"commit":{"message":"Variable length dataset fix, (0 length input fix)","shortMessageHtmlLink":"Variable length dataset fix, (0 length input fix)"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"startCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wNS0xNlQxNDo0MTowOS4wMDAwMDBazwAAAARLvln2","endCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wNC0yNVQxODoyODozOC4wMDAwMDBazwAAAAQ6eTz4"}},"title":"Activity ยท RWKV/RWKV-infctx-trainer"}