{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":785617449,"defaultBranch":"main","name":"InfiniTransformer","ownerLogin":"Beomi","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-04-12T08:55:57.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/11323660?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1713365472.0","currentOid":""},"activityList":{"items":[{"before":"3ca7fd5f7faaa9382cba6a98227a436e06be37fd","after":"045f4eba17a3155dbdc255d76b4623bebc768eb6","ref":"refs/heads/main","pushedAt":"2024-04-23T07:25:49.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Fix typo at README.md (#19)\n\nImplemenation -> Implementation","shortMessageHtmlLink":"Fix typo at README.md (#19)"}},{"before":"1f1ff444b7aa2d37a5dc5852e5aabb7e563b141e","after":"3ca7fd5f7faaa9382cba6a98227a436e06be37fd","ref":"refs/heads/main","pushedAt":"2024-04-21T13:18:17.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Minor fix typo in `dtype_memory_size_dict` (#18)\n\n* minor fix typo gpu_mem_track.py\r\n\r\nre-ordered memory size and fix typo about torch.short","shortMessageHtmlLink":"Minor fix typo in dtype_memory_size_dict (#18)"}},{"before":"41af75be3aceeb9e106038fb01dbdf9ed2da5760","after":"1f1ff444b7aa2d37a5dc5852e5aabb7e563b141e","ref":"refs/heads/main","pushedAt":"2024-04-19T08:36:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Set accelerate --num_processes=1 when 
training","shortMessageHtmlLink":"Set accelerate --num_processes=1 when training"}},{"before":"a5c3a912e0afff1c975408a0b9c3d4a08989631d","after":"41af75be3aceeb9e106038fb01dbdf9ed2da5760","ref":"refs/heads/main","pushedAt":"2024-04-19T06:48:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"38f81bfa6c0ae11eb932e37066b18e0597632bf5","after":"a5c3a912e0afff1c975408a0b9c3d4a08989631d","ref":"refs/heads/main","pushedAt":"2024-04-19T06:46:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"44dedfbc15f9acbb06aad63e5239f461b1510551","after":"38f81bfa6c0ae11eb932e37066b18e0597632bf5","ref":"refs/heads/main","pushedAt":"2024-04-19T06:41:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"a286b1c4a50614ae1dde0a9e9d5e35b472cc3697","after":"44dedfbc15f9acbb06aad63e5239f461b1510551","ref":"refs/heads/main","pushedAt":"2024-04-19T06:40:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add Infini-Llama3, with model/train codes. Resolve #3","shortMessageHtmlLink":"Add Infini-Llama3, with model/train codes. 
Resolve #3"}},{"before":"bbb6a1044bf2ef7747456a0df00ee890ce043bb2","after":"a286b1c4a50614ae1dde0a9e9d5e35b472cc3697","ref":"refs/heads/main","pushedAt":"2024-04-19T02:20:22.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add Inference code, Resolve #16","shortMessageHtmlLink":"Add Inference code, Resolve #16"}},{"before":"4498c4ee58903496d936ed89d77b1cbe1db79154","after":"bbb6a1044bf2ef7747456a0df00ee890ce043bb2","ref":"refs/heads/main","pushedAt":"2024-04-18T05:58:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add train.gemma.infini.noclm.32k.sh","shortMessageHtmlLink":"Add train.gemma.infini.noclm.32k.sh"}},{"before":"34114193d409b1fc99d15a1d5eaf6610fcc3af85","after":"4498c4ee58903496d936ed89d77b1cbe1db79154","ref":"refs/heads/main","pushedAt":"2024-04-18T05:45:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add wandb logging","shortMessageHtmlLink":"Add wandb logging"}},{"before":"03b4b88af3e57c5e66a5472d5844465c3768e2dd","after":"34114193d409b1fc99d15a1d5eaf6610fcc3af85","ref":"refs/heads/main","pushedAt":"2024-04-18T05:32:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"no use cuda visible devices on train script","shortMessageHtmlLink":"no use cuda visible devices on train 
script"}},{"before":"234f4a6c6e5a83401d3d3221d5bca5fe7310f7ae","after":"03b4b88af3e57c5e66a5472d5844465c3768e2dd","ref":"refs/heads/main","pushedAt":"2024-04-18T05:31:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add logging with wandb","shortMessageHtmlLink":"Add logging with wandb"}},{"before":"4bc7899e4ca275207417a61c803cad470655cfb0","after":"234f4a6c6e5a83401d3d3221d5bca5fe7310f7ae","ref":"refs/heads/main","pushedAt":"2024-04-18T05:24:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Memory does not use PE(Fix #15), Memory/Norm per layer(Fix #14)","shortMessageHtmlLink":"Memory does not use PE(Fix #15), Memory/Norm per layer(Fix #14)"}},{"before":"bd2bc882e07a9e942e3685e5dcdf7c4df08b5444","after":"4bc7899e4ca275207417a61c803cad470655cfb0","ref":"refs/heads/main","pushedAt":"2024-04-18T03:08:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"7a5f1494cb27549f62ac62677a5996cb4fc0b23f","after":"bd2bc882e07a9e942e3685e5dcdf7c4df08b5444","ref":"refs/heads/main","pushedAt":"2024-04-18T03:03:23.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"fix typo","shortMessageHtmlLink":"fix 
typo"}},{"before":"7fef857a464321c1ed62a660c9d77b1d590a3874","after":"7a5f1494cb27549f62ac62677a5996cb4fc0b23f","ref":"refs/heads/main","pushedAt":"2024-04-18T02:49:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"model train in FP32 for stability","shortMessageHtmlLink":"model train in FP32 for stability"}},{"before":"26972792e6473578635891367287eeecf9a1bb9e","after":"7fef857a464321c1ed62a660c9d77b1d590a3874","ref":"refs/heads/main","pushedAt":"2024-04-18T02:09:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"fix nan loss bug","shortMessageHtmlLink":"fix nan loss bug"}},{"before":"f228fbaba9499e2984208e0d226125569d5a7913","after":"26972792e6473578635891367287eeecf9a1bb9e","ref":"refs/heads/main","pushedAt":"2024-04-18T01:45:27.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Merge branch 'main' of github.com:Beomi/InfiniTransformer","shortMessageHtmlLink":"Merge branch 'main' of github.com:Beomi/InfiniTransformer"}},{"before":"ef964011da01be4728a0434e213c59aed51c3ef4","after":"f228fbaba9499e2984208e0d226125569d5a7913","ref":"refs/heads/main","pushedAt":"2024-04-18T01:36:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update 
README.md"}},{"before":"9406c53775bbf106fb9ff61cf72942a76808bf9c","after":"ef964011da01be4728a0434e213c59aed51c3ef4","ref":"refs/heads/main","pushedAt":"2024-04-17T15:08:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Remove WIP","shortMessageHtmlLink":"Remove WIP"}},{"before":"e481131f1f0f0d68b802a161f975600b63f1c8b4","after":"9406c53775bbf106fb9ff61cf72942a76808bf9c","ref":"refs/heads/main","pushedAt":"2024-04-17T15:01:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"6b2b5023c3c3a910161d896af40edf45d1e550e9","after":"e481131f1f0f0d68b802a161f975600b63f1c8b4","ref":"refs/heads/main","pushedAt":"2024-04-17T15:00:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"6f7e0412eb0ba3b0ef2d4b83e28d6d061a50b31b","after":null,"ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:51:12.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"}},{"before":"f755fc2e4295ad9d29003f9bc3cad88a7e9138b8","after":"6b2b5023c3c3a910161d896af40edf45d1e550e9","ref":"refs/heads/main","pushedAt":"2024-04-17T14:51:07.000Z","pushType":"pr_merge","commitsCount":8,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Merge pull request #12 
from Beomi/memory-optimize\n\nAdd Memory optimized model","shortMessageHtmlLink":"Merge pull request #12 from Beomi/memory-optimize"}},{"before":"794de70d3ee28576e41b24845e0ca78bc0945d30","after":"6f7e0412eb0ba3b0ef2d4b83e28d6d061a50b31b","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:50:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"train works with 2048*16=32768 seq len","shortMessageHtmlLink":"train works with 2048*16=32768 seq len"}},{"before":"c38298c2144ee40ac187679e546d8950d4f316de","after":"794de70d3ee28576e41b24845e0ca78bc0945d30","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:35:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Should I retrain graph?","shortMessageHtmlLink":"Should I retrain graph?"}},{"before":"88899721aec0b6d5f9840d02a13ececcdb713297","after":"c38298c2144ee40ac187679e546d8950d4f316de","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:29:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Fix typo","shortMessageHtmlLink":"Fix typo"}},{"before":"b031abc271d94dcc2d2a4cd5fa0c612465ecb3cd","after":"88899721aec0b6d5f9840d02a13ececcdb713297","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:28:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Fix typo","shortMessageHtmlLink":"Fix 
typo"}},{"before":"206237ecd081143f5c4b4266f3c1dd633fca5e4c","after":"b031abc271d94dcc2d2a4cd5fa0c612465ecb3cd","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T14:26:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add train.gemma.infini.noclm","shortMessageHtmlLink":"Add train.gemma.infini.noclm"}},{"before":"fc910886d22c9fd7c99974c0f06acde81d75b506","after":"206237ecd081143f5c4b4266f3c1dd633fca5e4c","ref":"refs/heads/memory-optimize","pushedAt":"2024-04-17T13:57:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Beomi","name":"Junbum Lee","path":"/Beomi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/11323660?s=80&v=4"},"commit":{"message":"Add test train code for infini gemma","shortMessageHtmlLink":"Add test train code for infini gemma"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEN8TccwA","startCursor":null,"endCursor":null}},"title":"Activity · Beomi/InfiniTransformer"}