{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":522950827,"defaultBranch":"main","name":"bigcode-evaluation-harness","ownerLogin":"bigcode-project","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2022-08-09T12:58:56.000Z","ownerAvatar":"https://github.com/avatars/u/110470554?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1721082730.0","currentOid":""},"activityList":{"items":[{"before":"8eed6237611fe516b64d323980e56d4b26fa316d","after":null,"ref":"refs/heads/MultiPL-Ev3","pushedAt":"2024-07-15T22:32:10.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"arjunguha","name":"Arjun Guha","path":"/arjunguha","primaryAvatarUrl":"https://github.com/avatars/u/20065?s=80&v=4"}},{"before":"06108e49684185221457a37269da103dca870b6f","after":null,"ref":"refs/heads/arjunguha-patch-1","pushedAt":"2024-07-15T22:32:07.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"arjunguha","name":"Arjun Guha","path":"/arjunguha","primaryAvatarUrl":"https://github.com/avatars/u/20065?s=80&v=4"}},{"before":"a83b1ca85163558e131a3cb4d33a4a7930c92cb4","after":"0f3e95f0806e78a4f432056cdb1be93604a51d69","ref":"refs/heads/main","pushedAt":"2024-07-14T18:07:56.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #255 from bigcode-project/arjunguha-patch-1\n\nUpdate Dockerfile-multiple","shortMessageHtmlLink":"Merge pull request #255 from bigcode-project/arjunguha-patch-1"}},{"before":"334efb7feb1c6d18fc4be2c71ae73248f3de8440","after":"a83b1ca85163558e131a3cb4d33a4a7930c92cb4","ref":"refs/heads/main","pushedAt":"2024-07-14T18:07:06.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #254 from bigcode-project/MultiPL-Ev3\n\nUpdate MultiPL-E to v3 prompts","shortMessageHtmlLink":"Merge pull request #254 from bigcode-project/MultiPL-Ev3"}},{"before":null,"after":"06108e49684185221457a37269da103dca870b6f","ref":"refs/heads/arjunguha-patch-1","pushedAt":"2024-07-12T14:02:17.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"arjunguha","name":"Arjun Guha","path":"/arjunguha","primaryAvatarUrl":"https://github.com/avatars/u/20065?s=80&v=4"},"commit":{"message":"Update Dockerfile-multiple\n\nThis updates the MultiPL-E Dockerfile to support v3.\r\n\r\nInstead of copy-pasta like before, I've had it inherit from the MultiPL-E native evaluation container. It is set to use an exact revision -- which is the v3 revision -- so we won't get any surprise updates.","shortMessageHtmlLink":"Update Dockerfile-multiple"}},{"before":null,"after":"8eed6237611fe516b64d323980e56d4b26fa316d","ref":"refs/heads/MultiPL-Ev3","pushedAt":"2024-07-12T13:36:38.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"arjunguha","name":"Arjun Guha","path":"/arjunguha","primaryAvatarUrl":"https://github.com/avatars/u/20065?s=80&v=4"},"commit":{"message":"Update MultiPL-E to v3 prompts\n\nI've put together a new MultiPL-E release, v3 and this updates the harness to point to the new prompts.\r\n\r\nThere are fixes to old prompts as well as support for new languages, both described on the MultiPL-E dataset page. The nature of fixes is that some PLs have their scores go up a little. I've tested with with StarCoder2-15B (using VLLM) and will continue testing other models.","shortMessageHtmlLink":"Update MultiPL-E to v3 prompts"}},{"before":"4659ecdafb0f7973e4d27942b559ff24bc7f192e","after":"334efb7feb1c6d18fc4be2c71ae73248f3de8440","ref":"refs/heads/main","pushedAt":"2024-06-24T09:22:25.000Z","pushType":"pr_merge","commitsCount":5,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #244 from meher-m/transformers_fix\n\nAdding support for transformers>=4.40.2 to avoid crash with mbpp","shortMessageHtmlLink":"Merge pull request #244 from meher-m/transformers_fix"}},{"before":"f0f2b52ab0bac95b7fa881693e82c5ddcf2f9e95","after":"4659ecdafb0f7973e4d27942b559ff24bc7f192e","ref":"refs/heads/main","pushedAt":"2024-06-21T09:33:30.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #247 from anil-gurbuz/leaderboard-documentation-fix\n\nFix: Leaderboard submission Documentation","shortMessageHtmlLink":"Merge pull request #247 from anil-gurbuz/leaderboard-documentation-fix"}},{"before":"84b96da31b7f840b55c5733325346176140cdb6b","after":"f0f2b52ab0bac95b7fa881693e82c5ddcf2f9e95","ref":"refs/heads/main","pushedAt":"2024-05-29T22:30:12.000Z","pushType":"pr_merge","commitsCount":23,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #238 from Elfsong/mercury\n\nAdd a new dataset Mercury","shortMessageHtmlLink":"Merge pull request #238 from Elfsong/mercury"}},{"before":"a1b4a7949a24c8e3ef0d05a01097b2d14ffba56e","after":"84b96da31b7f840b55c5733325346176140cdb6b","ref":"refs/heads/main","pushedAt":"2024-05-05T22:31:13.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #232 from shehrozek-cerebras/make_bigcode_pip_installable\n\nAdd package name and enforce python version in `setup.py`","shortMessageHtmlLink":"Merge pull request #232 from shehrozek-cerebras/make_bigcode_pip_inst…"}},{"before":"1b0147c50f406ff66ac4f806230479f31d19c7e6","after":"a1b4a7949a24c8e3ef0d05a01097b2d14ffba56e","ref":"refs/heads/main","pushedAt":"2024-04-23T18:09:11.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"arjunguha","name":"Arjun Guha","path":"/arjunguha","primaryAvatarUrl":"https://github.com/avatars/u/20065?s=80&v=4"},"commit":{"message":"Add StudentEval from LLM4Code 2024","shortMessageHtmlLink":"Add StudentEval from LLM4Code 2024"}},{"before":"642c57f138390828c743a748469c2a82d9bff72b","after":"1b0147c50f406ff66ac4f806230479f31d19c7e6","ref":"refs/heads/main","pushedAt":"2024-04-19T21:47:34.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #223 from ganler/evalplus-maintain\n\nrefactor(evalplus): maintain mbpp+ v0.2.0","shortMessageHtmlLink":"Merge pull request #223 from ganler/evalplus-maintain"}},{"before":"094c7cc197d13a53c19303865e2056f1c7488ac1","after":"642c57f138390828c743a748469c2a82d9bff72b","ref":"refs/heads/main","pushedAt":"2024-04-16T20:06:52.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #219 from bigcode-project/loubnabnl-patch-9\n\nAdd instruct models prompts","shortMessageHtmlLink":"Merge pull request #219 from bigcode-project/loubnabnl-patch-9"}},{"before":null,"after":"0cf6eaed1c284e873c5cc491ab722be3e586f515","ref":"refs/heads/loubnabnl-patch-9","pushedAt":"2024-04-16T20:06:18.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Add instruct models prompts","shortMessageHtmlLink":"Add instruct models prompts"}},{"before":"e54f33d093f342ffc0c5c057910c00aa2081515d","after":"094c7cc197d13a53c19303865e2056f1c7488ac1","ref":"refs/heads/main","pushedAt":"2024-03-27T15:54:36.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Merge pull request #208 from bigcode-project/aurora-prompt\n\nAdd prompt","shortMessageHtmlLink":"Merge pull request #208 from bigcode-project/aurora-prompt"}},{"before":null,"after":"974c7ed1ec23d4c5c95ab08eb8bdec43cc6d8a10","ref":"refs/heads/aurora-prompt","pushedAt":"2024-03-21T15:22:26.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Add prompt","shortMessageHtmlLink":"Add prompt"}},{"before":"849481c0b540780dd65cc4d8071b9e0be8e75839","after":"e54f33d093f342ffc0c5c057910c00aa2081515d","ref":"refs/heads/main","pushedAt":"2024-03-01T10:01:22.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #201 from bigcode-project/issueprompt\n\nAdd issue prompt","shortMessageHtmlLink":"Merge pull request #201 from bigcode-project/issueprompt"}},{"before":"d4243c40f47077517ea002fff7f0653c5d1430a0","after":"b52b68ac577644151e46d63d68881faed7253e13","ref":"refs/heads/astraios","pushedAt":"2024-02-26T15:34:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"terryyz","name":"Terry Zhuo","path":"/terryyz","primaryAvatarUrl":"https://github.com/avatars/u/36221214?s=80&v=4"},"commit":{"message":"Update aatk.py","shortMessageHtmlLink":"Update aatk.py"}},{"before":null,"after":"1e4bb7e830a314264f51471ae189924157b3544d","ref":"refs/heads/issueprompt","pushedAt":"2024-02-26T09:09:59.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Add issue prompt","shortMessageHtmlLink":"Add issue prompt"}},{"before":"2ec01598062766350cf79a11ff05d08fc16373ac","after":"849481c0b540780dd65cc4d8071b9e0be8e75839","ref":"refs/heads/main","pushedAt":"2024-02-17T07:52:30.000Z","pushType":"pr_merge","commitsCount":4,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Merge pull request #199 from bigcode-project/addprompts\n\nAdd prompts","shortMessageHtmlLink":"Merge pull request #199 from bigcode-project/addprompts"}},{"before":"d2ea11591a2d7bf741475821e16a7bf83bc022fd","after":"649d82bbf225086ec2045fdf8cf9908999b3bcbb","ref":"refs/heads/addprompts","pushedAt":"2024-02-17T07:52:11.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Merge branch 'main' into addprompts","shortMessageHtmlLink":"Merge branch 'main' into addprompts"}},{"before":"00967d12093ef614de7bdad0772aed8e4118f1fd","after":"2ec01598062766350cf79a11ff05d08fc16373ac","ref":"refs/heads/main","pushedAt":"2024-02-16T22:04:18.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #194 from bigcode-project/loubnabnl-patch-8\n\nadd support for codellama-70b prompt","shortMessageHtmlLink":"Merge pull request #194 from bigcode-project/loubnabnl-patch-8"}},{"before":"09c4002bb0d2704147bb12f58c834f252f7f35f5","after":"d2ea11591a2d7bf741475821e16a7bf83bc022fd","ref":"refs/heads/addprompts","pushedAt":"2024-02-16T11:32:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Add refs","shortMessageHtmlLink":"Add refs"}},{"before":null,"after":"09c4002bb0d2704147bb12f58c834f252f7f35f5","ref":"refs/heads/addprompts","pushedAt":"2024-02-16T11:29:48.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Muennighoff","name":"Niklas Muennighoff","path":"/Muennighoff","primaryAvatarUrl":"https://github.com/avatars/u/62820084?s=80&v=4"},"commit":{"message":"Add prompts","shortMessageHtmlLink":"Add prompts"}},{"before":null,"after":"0261c520c6636455e78da289e8e17cce2bacf629","ref":"refs/heads/loubnabnl-patch-8","pushedAt":"2024-01-29T18:57:47.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"add support for codellama-70b prompt","shortMessageHtmlLink":"add support for codellama-70b prompt"}},{"before":"9cfa52b2819e686363ac3a9feb6f3c096e0d47a3","after":"00967d12093ef614de7bdad0772aed8e4118f1fd","ref":"refs/heads/main","pushedAt":"2024-01-29T18:41:14.000Z","pushType":"pr_merge","commitsCount":4,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #190 from ganler/mbppplus\n\nAdd mbpp+ evaluation task","shortMessageHtmlLink":"Merge pull request #190 from ganler/mbppplus"}},{"before":"efd2121679d765e7db993e0e2be5cea801d5f84d","after":"a7b1b6e29f304d0e882c7cb429c327d80c40b6e7","ref":"refs/heads/raymond-fix-gsm","pushedAt":"2024-01-23T19:50:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RaymondLi0","name":null,"path":"/RaymondLi0","primaryAvatarUrl":"https://github.com/avatars/u/11444023?s=80&v=4"},"commit":{"message":"gsm: stop at stop tokens","shortMessageHtmlLink":"gsm: stop at stop tokens"}},{"before":"3910745963a41df129eae8823836cc30a43088c9","after":"9cfa52b2819e686363ac3a9feb6f3c096e0d47a3","ref":"refs/heads/main","pushedAt":"2024-01-23T10:21:45.000Z","pushType":"pr_merge","commitsCount":4,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #187 from ganler/heplus\n\nAdd humaneval+ evaluation task","shortMessageHtmlLink":"Merge pull request #187 from ganler/heplus"}},{"before":null,"after":"efd2121679d765e7db993e0e2be5cea801d5f84d","ref":"refs/heads/raymond-fix-gsm","pushedAt":"2024-01-22T15:36:42.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"RaymondLi0","name":null,"path":"/RaymondLi0","primaryAvatarUrl":"https://github.com/avatars/u/11444023?s=80&v=4"},"commit":{"message":"catch if intermediate generations file not found","shortMessageHtmlLink":"catch if intermediate generations file not found"}},{"before":"e4fd5634fd63eb4b1e23c5fd10a54aa2bb29f8b8","after":"3910745963a41df129eae8823836cc30a43088c9","ref":"refs/heads/main","pushedAt":"2024-01-19T18:02:44.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"loubnabnl","name":"Loubna Ben Allal","path":"/loubnabnl","primaryAvatarUrl":"https://github.com/avatars/u/44069155?s=80&v=4"},"commit":{"message":"Merge pull request #184 from bigcode-project/support-left-pad\n\nsupport left padding and prefix post-processing for models like chatglm","shortMessageHtmlLink":"Merge pull request #184 from bigcode-project/support-left-pad"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEgC3vQwA","startCursor":null,"endCursor":null}},"title":"Activity · bigcode-project/bigcode-evaluation-harness"}