{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":506033104,"defaultBranch":"master","name":"k-diffusion","ownerLogin":"crowsonkb","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2022-06-21T23:22:46.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/4657022?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1701955618.0","currentOid":""},"activityList":{"items":[{"before":"6ab5146d4a5ef63901326489f31f1d8e7dd36b48","after":"21d12c91ad4550e8fcf3308ff9fe7116b3f19a08","ref":"refs/heads/master","pushedAt":"2024-05-06T18:44:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Add support for NATTEN 0.17.0 (fused neighborhood attention)","shortMessageHtmlLink":"Add support for NATTEN 0.17.0 (fused neighborhood attention)"}},{"before":"8ace775a8409f074fbfdd852f57b6de6f6440191","after":"6ab5146d4a5ef63901326489f31f1d8e7dd36b48","ref":"refs/heads/master","pushedAt":"2024-01-24T19:36:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Cast a to v's dtype in neighborhood attention blocks","shortMessageHtmlLink":"Cast a to v's dtype in neighborhood attention blocks"}},{"before":"cc49cf6182284e577e896943f8e29c7c9d1a7f2c","after":"8ace775a8409f074fbfdd852f57b6de6f6440191","ref":"refs/heads/master","pushedAt":"2024-01-23T00:54:42.000Z","pushType":"push","commitsCount":45,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Update README for transformer-model-v2","shortMessageHtmlLink":"Update README for transformer-model-v2"}},{"before":"0c6cc822e050e59d3e59128c57d350074969b267","after":"cc49cf6182284e577e896943f8e29c7c9d1a7f2c","ref":"refs/heads/master","pushedAt":"2023-12-07T13:28:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Add DOI badge to README","shortMessageHtmlLink":"Add DOI badge to README"}},{"before":"045515774882014cc14c1ba2668ab5bad9cbf7c0","after":"0c6cc822e050e59d3e59128c57d350074969b267","ref":"refs/heads/master","pushedAt":"2023-12-07T13:26:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Release 0.1.1.post1","shortMessageHtmlLink":"Release 0.1.1.post1"}},{"before":"f4cfe66ea10589062e2157d99654696beac2bf5f","after":"9737cfd85120cba1258b5b5b1dc6511356b5c924","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-28T14:23:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Fix flop counter","shortMessageHtmlLink":"Fix flop counter"}},{"before":"f9d5a59426c9d2c64810b05e4395977d9106fd40","after":"f4cfe66ea10589062e2157d99654696beac2bf5f","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-27T23:43:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Per level dropout rate","shortMessageHtmlLink":"Per level dropout rate"}},{"before":"11e69027f628128a49b5739e51ac38fb6d21358e","after":"f9d5a59426c9d2c64810b05e4395977d9106fd40","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-27T23:41:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"WIP flop counter","shortMessageHtmlLink":"WIP flop counter"}},{"before":"f4a74f1ec906cb62916f58288ec73ef0330ba446","after":"045515774882014cc14c1ba2668ab5bad9cbf7c0","ref":"refs/heads/master","pushedAt":"2023-10-10T06:47:29.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Release 0.1.1","shortMessageHtmlLink":"Release 0.1.1"}},{"before":"962d28bf5306dfb4f36145301066702da38f8124","after":"11e69027f628128a49b5739e51ac38fb6d21358e","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-09T23:19:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Add --evaluate-only to train.py","shortMessageHtmlLink":"Add --evaluate-only to train.py"}},{"before":"8907fea5906b71887a859bffdef05041e4d1b142","after":"962d28bf5306dfb4f36145301066702da38f8124","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-09T18:38:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Weight decay token merge and split projections","shortMessageHtmlLink":"Weight decay token merge and split projections"}},{"before":"ccd801fb8a625d8a715476043c10d379b86c16a0","after":"8907fea5906b71887a859bffdef05041e4d1b142","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-09T18:24:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Don't spawn a bunch of processes on import","shortMessageHtmlLink":"Don't spawn a bunch of processes on import"}},{"before":"134015491a9fb2eb98e770f7d454d75c094fd436","after":"ccd801fb8a625d8a715476043c10d379b86c16a0","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-08T16:15:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Fix wall clock time counter","shortMessageHtmlLink":"Fix wall clock time counter"}},{"before":"de9bb2d1cc9b575c524c7fab6ee0a616870ef44b","after":"134015491a9fb2eb98e770f7d454d75c094fd436","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-06T23:30:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Default to no checkpointing if not in the checkpointing context manager","shortMessageHtmlLink":"Default to no checkpointing if not in the checkpointing context manager"}},{"before":"9a6e9f373c7a7644fa9cedd926b3f03da7d7942e","after":"de9bb2d1cc9b575c524c7fab6ee0a616870ef44b","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-05T16:59:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Avoid an extra allocation in apply_rotary_emb_()","shortMessageHtmlLink":"Avoid an extra allocation in apply_rotary_emb_()"}},{"before":"6b745a528554731867842a1b848e9b2700c0eaf7","after":"9a6e9f373c7a7644fa9cedd926b3f03da7d7942e","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-05T01:01:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Add 8-bit Adam","shortMessageHtmlLink":"Add 8-bit Adam"}},{"before":"b1748a8c7957dc1b60e84442a9e0ee820ca1fa9a","after":"6b745a528554731867842a1b848e9b2700c0eaf7","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-04T22:18:18.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Require PyTorch 2.1","shortMessageHtmlLink":"Require PyTorch 2.1"}},{"before":"46bd364bb4a41e5d3ae7a367ba7018271df98812","after":"b1748a8c7957dc1b60e84442a9e0ee820ca1fa9a","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-04T14:07:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Optimize apply_rotary_emb() further","shortMessageHtmlLink":"Optimize apply_rotary_emb() further"}},{"before":"e6760d3423fa707f2d452c1d84b032f17861c3e5","after":"46bd364bb4a41e5d3ae7a367ba7018271df98812","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-04T05:31:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Simplify apply_rotary_emb() etc","shortMessageHtmlLink":"Simplify apply_rotary_emb() etc"}},{"before":"fde0b4e263e10488efcd90d0b4f5eb54de9d24d7","after":"e6760d3423fa707f2d452c1d84b032f17861c3e5","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-03T20:51:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Use lru_cache on make_shifted_window_masks()","shortMessageHtmlLink":"Use lru_cache on make_shifted_window_masks()"}},{"before":"0e6bb3969c3d73e10d118c9e2deb0144b2906083","after":"fde0b4e263e10488efcd90d0b4f5eb54de9d24d7","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-03T20:30:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Change cos/sin axes to index from right consistently","shortMessageHtmlLink":"Change cos/sin axes to index from right consistently"}},{"before":"1b2bc7cecc62da1abb19cd0f06eeb4a75912857f","after":"0e6bb3969c3d73e10d118c9e2deb0144b2906083","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-03T13:56:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Fix rotary for non-flash attention","shortMessageHtmlLink":"Fix rotary for non-flash attention"}},{"before":"31d4bd271adf135f56d3c3f21740521a89e1e483","after":"1b2bc7cecc62da1abb19cd0f06eeb4a75912857f","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-02T19:57:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Different rotary freqs per head","shortMessageHtmlLink":"Different rotary freqs per head"}},{"before":"29c6a891ef9dfba236da8f907f82542f21d1cc62","after":"31d4bd271adf135f56d3c3f21740521a89e1e483","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-01T21:31:19.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Set default mapping network width to 256, allow configuring mapping network","shortMessageHtmlLink":"Set default mapping network width to 256, allow configuring mapping n…"}},{"before":"b4f9c6994231d1293243c1e43efa1448d5d4020e","after":"29c6a891ef9dfba236da8f907f82542f21d1cc62","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-10-01T21:13:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Set default mapping network width to 2, allow configuring mapping network","shortMessageHtmlLink":"Set default mapping network width to 2, allow configuring mapping net…"}},{"before":"71bc989cda99aa3d6d6e10e7ecb159753fad79b9","after":"b4f9c6994231d1293243c1e43efa1448d5d4020e","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-09-30T23:01:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Note that you have to install Hugging Face datasets for Oxford Flowers","shortMessageHtmlLink":"Note that you have to install Hugging Face datasets for Oxford Flowers"}},{"before":"0a109b35a41904b0152f88b919ea53f5913523ca","after":"71bc989cda99aa3d6d6e10e7ecb159753fad79b9","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-09-30T22:27:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Don't require pytorch nightly for shifted window attention","shortMessageHtmlLink":"Don't require pytorch nightly for shifted window attention"}},{"before":"6dac00688c6f1b06232743ec11942ed80c551f2d","after":"0a109b35a41904b0152f88b919ea53f5913523ca","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-09-30T22:17:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Update configs and README","shortMessageHtmlLink":"Update configs and README"}},{"before":"501f7cfa0376e5d402ad1c3a714b5506b246dc15","after":"6dac00688c6f1b06232743ec11942ed80c551f2d","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-09-30T19:52:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Print world size and batch size in train.py","shortMessageHtmlLink":"Print world size and batch size in train.py"}},{"before":"4c1093c0fb4cbb916b0d042f7ade279e53a5eefc","after":"501f7cfa0376e5d402ad1c3a714b5506b246dc15","ref":"refs/heads/transformer-model-v2","pushedAt":"2023-09-30T19:05:20.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"crowsonkb","name":"Katherine Crowson","path":"/crowsonkb","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/4657022?s=80&v=4"},"commit":{"message":"Add shifted window attention","shortMessageHtmlLink":"Add shifted window attention"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEQtWY6wA","startCursor":null,"endCursor":null}},"title":"Activity · crowsonkb/k-diffusion"}