{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":155220641,"defaultBranch":"main","name":"transformers","ownerLogin":"huggingface","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2018-10-29T13:56:00.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/25720743?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1721168314.0","currentOid":""},"activityList":{"items":[{"before":"4c9e4c6acf2baa976434ece2046eb71ca57b2e5d","after":null,"ref":"refs/heads/muellerzr-more-failing","pushedAt":"2024-07-16T22:18:34.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"}},{"before":"6f40a213eb10e38a5f242d0645519d413d32d798","after":"4037a2b5b1278736e566aec12e169100275545ea","ref":"refs/heads/main","pushedAt":"2024-07-16T22:18:32.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"SpeechEncoderDecoder doesn't support param buffer assignments (#32009)\n\nOne more model","shortMessageHtmlLink":"SpeechEncoderDecoder doesn't support param buffer assignments (#32009)"}},{"before":null,"after":"4c9e4c6acf2baa976434ece2046eb71ca57b2e5d","ref":"refs/heads/muellerzr-more-failing","pushedAt":"2024-07-16T20:10:56.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"One more model","shortMessageHtmlLink":"One more model"}},{"before":"02769316bba50bf0b4bb3f03c9d329283e17cc75","after":null,"ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T18:35:59.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"}},{"before":"e391706420934f6c87cebe9997fc85a757aa4353","after":"6f40a213eb10e38a5f242d0645519d413d32d798","ref":"refs/heads/main","pushedAt":"2024-07-16T18:35:57.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Fix if else and *actually* enable superfast init (#32007)\n\n* Fix if else\r\n\r\n* rm err raise","shortMessageHtmlLink":"Fix if else and *actually* enable superfast init (#32007)"}},{"before":"c22efa61968a6aad93709594583610482b689836","after":"e391706420934f6c87cebe9997fc85a757aa4353","ref":"refs/heads/main","pushedAt":"2024-07-16T18:35:10.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"amyeroberts","name":null,"path":"/amyeroberts","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/22614925?s=80&v=4"},"commit":{"message":"Fix gather when collecting 'num_input_tokens_seen' (#31974)\n\n* Move token count to device before gathering\r\n\r\n* Run 'make style; make quality'","shortMessageHtmlLink":"Fix gather when collecting 'num_input_tokens_seen' (#31974)"}},{"before":"88e0813d8dde26b43a427c5d1a519f0e6ce3392f","after":"c22efa61968a6aad93709594583610482b689836","ref":"refs/heads/main","pushedAt":"2024-07-16T18:22:45.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"gante","name":"Joao Gante","path":"/gante","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12240844?s=80&v=4"},"commit":{"message":"Bug report update -- round 2 (#32006)\n\n* like this?\r\n\r\n* Update .github/ISSUE_TEMPLATE/bug-report.yml\r\n\r\nCo-authored-by: amyeroberts <22614925+amyeroberts@users.noreply.github.com>\r\n\r\n---------\r\n\r\nCo-authored-by: amyeroberts <22614925+amyeroberts@users.noreply.github.com>","shortMessageHtmlLink":"Bug report update -- round 2 (#32006)"}},{"before":"11b4f148e43aad5cd1aa3049cca9e929bbea329d","after":"02769316bba50bf0b4bb3f03c9d329283e17cc75","ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T17:24:17.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"rm err raise","shortMessageHtmlLink":"rm err raise"}},{"before":"9f06930e8ec513cf18992c425a6e26d3792a795b","after":"11b4f148e43aad5cd1aa3049cca9e929bbea329d","ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T17:15:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Right wording","shortMessageHtmlLink":"Right wording"}},{"before":"02769316bba50bf0b4bb3f03c9d329283e17cc75","after":"9f06930e8ec513cf18992c425a6e26d3792a795b","ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T17:14:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Fix test too","shortMessageHtmlLink":"Fix test too"}},{"before":"ed240ad0edb8250c8d6bed6528eb4630b3cf6ff5","after":"02769316bba50bf0b4bb3f03c9d329283e17cc75","ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T16:55:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"rm err raise","shortMessageHtmlLink":"rm err raise"}},{"before":null,"after":"ed240ad0edb8250c8d6bed6528eb4630b3cf6ff5","ref":"refs/heads/muellerzr-fix-fastinit","pushedAt":"2024-07-16T16:51:53.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Fix if else","shortMessageHtmlLink":"Fix if else"}},{"before":"036d3de23d8d682f5436bc36f6653d90b411c764","after":"88e0813d8dde26b43a427c5d1a519f0e6ce3392f","ref":"refs/heads/main","pushedAt":"2024-07-16T16:28:15.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"amyeroberts","name":null,"path":"/amyeroberts","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/22614925?s=80&v=4"},"commit":{"message":"fix: Fixed incorrect dictionary assignment in `src/transformers/__init__.py` (#31993)\n\nFixed incorrect dictionary assignment.","shortMessageHtmlLink":"fix: Fixed incorrect dictionary assignment in `src/transformers/__ini…"}},{"before":"89eec5cf2068cc871b094b60f66f19dd252cb6b3","after":"036d3de23d8d682f5436bc36f6653d90b411c764","ref":"refs/heads/main","pushedAt":"2024-07-16T15:55:41.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ArthurZucker","name":"Arthur","path":"/ArthurZucker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/48595927?s=80&v=4"},"commit":{"message":"add flash-attn deterministic option to flash-attn>=2.4.1 (#31961)\n\n* add flash-attn deterministic option to flash-attn>=2.4.1\r\n\r\n* Add Missing Import\r\n\r\n* Fix ruff linting issues\r\n\r\n* Replace `is_flash_attn_greater_or_equal_2_41` with the existing `is_flash_attn_greater_or_equal`\r\n\r\n---------\r\n\r\nCo-authored-by: jun.4 ","shortMessageHtmlLink":"add flash-attn deterministic option to flash-attn>=2.4.1 (#31961)"}},{"before":"999981daf4acf21cd80d843ee5069123aadf4796","after":"89eec5cf2068cc871b094b60f66f19dd252cb6b3","ref":"refs/heads/main","pushedAt":"2024-07-16T15:51:05.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"gante","name":"Joao Gante","path":"/gante","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12240844?s=80&v=4"},"commit":{"message":"Bug report update (#31983)","shortMessageHtmlLink":"Bug report update (#31983)"}},{"before":"693cb828ff5e0e530db4f054092b6687439ede15","after":"999981daf4acf21cd80d843ee5069123aadf4796","ref":"refs/heads/main","pushedAt":"2024-07-16T15:49:54.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"gante","name":"Joao Gante","path":"/gante","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12240844?s=80&v=4"},"commit":{"message":"Tests: remove cuda versions when the result is the same 🧹🧹 (#31955)\n\nremove cuda versions when the result is the same","shortMessageHtmlLink":"Tests: remove cuda versions when the result is the same 🧹🧹 (#31955)"}},{"before":"9ad0cce0f7f194f39d2389f1024f9eb9c848cf1d","after":null,"ref":"refs/heads/fix-slower-ish","pushedAt":"2024-07-16T14:33:07.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"}},{"before":"25e5e3fa56d73d07d6a1c46306a5f3f1fd862463","after":"693cb828ff5e0e530db4f054092b6687439ede15","ref":"refs/heads/main","pushedAt":"2024-07-16T14:33:05.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Fix bad test about slower init (#32002)\n\nBronked main","shortMessageHtmlLink":"Fix bad test about slower init (#32002)"}},{"before":"e0dfd7bcaf7ff0723085f23244a755cc2ed92466","after":"25e5e3fa56d73d07d6a1c46306a5f3f1fd862463","ref":"refs/heads/main","pushedAt":"2024-07-16T14:11:37.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ydshieh","name":"Yih-Dar","path":"/ydshieh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/2521628?s=80&v=4"},"commit":{"message":"[tests] fix deepspeed zero3 config for `test_stage3_nvme_offload` (#31881)\n\nfix config","shortMessageHtmlLink":"[tests] fix deepspeed zero3 config for test_stage3_nvme_offload (#3…"}},{"before":null,"after":"9ad0cce0f7f194f39d2389f1024f9eb9c848cf1d","ref":"refs/heads/fix-slower-ish","pushedAt":"2024-07-16T13:58:16.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Bronked main","shortMessageHtmlLink":"Bronked main"}},{"before":"21af73ada1c26d31a8260feb8943026307fcea42","after":null,"ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T13:32:03.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"}},{"before":"03a3becc48f14a481b578c4d1c02273da9a1cc81","after":"e0dfd7bcaf7ff0723085f23244a755cc2ed92466","ref":"refs/heads/main","pushedAt":"2024-07-16T13:32:01.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Speedup model init on CPU (by 10x+ for llama-3-8B as one example) (#31771)\n\n* 1,100%!\r\n\r\n* Clean\r\n\r\n* Don't touch DS\r\n\r\n* Experiment with dtype allocation\r\n\r\n* skip test_load_save_without_tied_weights test\r\n\r\n* A little faster\r\n\r\n* Include proper upscaling?\r\n\r\n* Fixup tests\r\n\r\n* Potentially skip?\r\n\r\n* Let's see if this fixes git history\r\n\r\n* Maintain new dtype\r\n\r\n* Fin\r\n\r\n* Rm hook idea for now\r\n\r\n* New approach, see what breaks\r\n\r\n* stage\r\n\r\n* Clean\r\n\r\n* Stash\r\n\r\n* Should be fin now, just need to mark failing models\r\n\r\n* Clean up\r\n\r\n* Simplify\r\n\r\n* Deal with weird models\r\n\r\n* Enc/Dec\r\n\r\n* Skip w/ reason\r\n\r\n* Adjust test\r\n\r\n* Fix test\r\n\r\n* one more test\r\n\r\n* Keep experimenting\r\n\r\n* Fix ref\r\n\r\n* TO REMOVE: testing feedback CI\r\n\r\n* Right push\r\n\r\n* Update tests/utils/test_modeling_utils.py\r\n\r\nCo-authored-by: Arthur <48595927+ArthurZucker@users.noreply.github.com>\r\n\r\n* disable\r\n\r\n* Add new func\r\n\r\n* Test nits from Amy\r\n\r\n* Update src/transformers/modeling_utils.py\r\n\r\nCo-authored-by: amyeroberts <22614925+amyeroberts@users.noreply.github.com>\r\n\r\n* Adjust comment\r\n\r\n* Adjust comment on skip\r\n\r\n* make private\r\n\r\n* Fin\r\n\r\n* Should be a not flag\r\n\r\n* Clarify and rename test\r\n\r\n---------\r\n\r\nCo-authored-by: Marc Sun \r\nCo-authored-by: Arthur <48595927+ArthurZucker@users.noreply.github.com>\r\nCo-authored-by: amyeroberts <22614925+amyeroberts@users.noreply.github.com>","shortMessageHtmlLink":"Speedup model init on CPU (by 10x+ for llama-3-8B as one example) (#3…"}},{"before":"70448cdff26887dbe8cee835ae20109dfbbf783f","after":"21af73ada1c26d31a8260feb8943026307fcea42","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:56:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Clarify and rename test","shortMessageHtmlLink":"Clarify and rename test"}},{"before":"1e5466a87d8cb0ecfccb2a3d799c74f6ebb00fae","after":"70448cdff26887dbe8cee835ae20109dfbbf783f","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:42:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Should be a not flag","shortMessageHtmlLink":"Should be a not flag"}},{"before":"ac946aac257cadfa8264fa4a284cd0ea1061c5b5","after":"03a3becc48f14a481b578c4d1c02273da9a1cc81","ref":"refs/heads/main","pushedAt":"2024-07-16T12:33:22.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ArthurZucker","name":"Arthur","path":"/ArthurZucker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/48595927?s=80&v=4"},"commit":{"message":"Cambricon MLUs support SDPA and flash_attn (#31102)\n\n* add Cambricon MLUs support\r\n\r\n* fix mlu device rng state\r\n\r\n* up for quality check\r\n\r\n* up mlu to support fp16\r\n\r\n* fix mlu device dependency error\r\n\r\n* fix mlu device dependency error\r\n\r\n* enable mlu device for bf16\r\n\r\n* fix mlu device memory tracker\r\n\r\n* Cambricon support SDPA and flash_attn","shortMessageHtmlLink":"Cambricon MLUs support SDPA and flash_attn (#31102)"}},{"before":"ada401f47424460b2e172f82ecfe8e7d8fa166cc","after":"1e5466a87d8cb0ecfccb2a3d799c74f6ebb00fae","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:33:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Fin","shortMessageHtmlLink":"Fin"}},{"before":"512f34adf125e04b58dc868cf83f725cb1276475","after":"ada401f47424460b2e172f82ecfe8e7d8fa166cc","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:22:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"make private","shortMessageHtmlLink":"make private"}},{"before":"e8f4a1485d33cba589c856b6144aabba7aa10f1a","after":"512f34adf125e04b58dc868cf83f725cb1276475","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:21:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Adjust comment on skip","shortMessageHtmlLink":"Adjust comment on skip"}},{"before":"fd3890aceab3968dfc17155c0943551fafb11e50","after":"e8f4a1485d33cba589c856b6144aabba7aa10f1a","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:20:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Adjust comment","shortMessageHtmlLink":"Adjust comment"}},{"before":"c491952deb61fa790555e7463451e0530a0284e7","after":"fd3890aceab3968dfc17155c0943551fafb11e50","ref":"refs/heads/muellerzr-speedup-inference","pushedAt":"2024-07-16T12:11:10.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"muellerzr","name":"Zach Mueller","path":"/muellerzr","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7831895?s=80&v=4"},"commit":{"message":"Merge branch 'muellerzr-speedup-inference' of https://github.com/huggingface/transformers into muellerzr-speedup-inference","shortMessageHtmlLink":"Merge branch 'muellerzr-speedup-inference' of https://github.com/hugg…"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEgT6wCwA","startCursor":null,"endCursor":null}},"title":"Activity · huggingface/transformers"}