{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":758581331,"defaultBranch":"master","name":"minbpe","ownerLogin":"karpathy","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-02-16T16:18:15.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/241138?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1708100296.0","currentOid":""},"activityList":{"items":[{"before":"2963f82739b1f420093941aaf89944bf4d9947f1","after":"1acefe89412b20245db5a22d2a02001e547dc602","ref":"refs/heads/master","pushedAt":"2024-04-22T22:11:37.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #67 from shubham0204/master\n\nadd `gnp/minbpe-rs` as community extensions in `README.md`","shortMessageHtmlLink":"Merge pull request #67 from shubham0204/master"}},{"before":"173b67f3d6cb0e7ab89fae0359c8b444ce3e10ad","after":"2963f82739b1f420093941aaf89944bf4d9947f1","ref":"refs/heads/master","pushedAt":"2024-02-26T23:56:33.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #43 from AneeshBose/aneesh/lecture-md\n\nfix minor issue in token count","shortMessageHtmlLink":"Merge pull request #43 from AneeshBose/aneesh/lecture-md"}},{"before":"d201df864173e9d947432673ba428428bed5d311","after":"173b67f3d6cb0e7ab89fae0359c8b444ce3e10ad","ref":"refs/heads/master","pushedAt":"2024-02-23T00:08:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"ugh fix image link","shortMessageHtmlLink":"ugh fix image link"}},{"before":"9324a08729f2d21635e88ea201faae659fb0f4d3","after":"d201df864173e9d947432673ba428428bed5d311","ref":"refs/heads/master","pushedAt":"2024-02-23T00:05:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"more work on lecture hehe. this is hard work! not sure an LLM can do this tbh","shortMessageHtmlLink":"more work on lecture hehe. this is hard work! not sure an LLM can do …"}},{"before":"966f46b20844494ea2ec48b8c65650e1c1b4f31a","after":"9324a08729f2d21635e88ea201faae659fb0f4d3","ref":"refs/heads/master","pushedAt":"2024-02-22T23:20:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"text version of the lecture","shortMessageHtmlLink":"text version of the lecture"}},{"before":"f50ad93aa65072ac23e0a7e0bbc64c9c4e26cc4a","after":"966f46b20844494ea2ec48b8c65650e1c1b4f31a","ref":"refs/heads/master","pushedAt":"2024-02-21T15:38:59.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #33 from richzw/master\n\nupdate readme.md with video link","shortMessageHtmlLink":"Merge pull request #33 from richzw/master"}},{"before":"a98e0a57d83b37d7a7e124ac55e4ad55934df535","after":"f50ad93aa65072ac23e0a7e0bbc64c9c4e26cc4a","ref":"refs/heads/master","pushedAt":"2024-02-20T18:58:17.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #24 from nobleaustine/pytest_modify\n\nupdated .gitignore","shortMessageHtmlLink":"Merge pull request #24 from nobleaustine/pytest_modify"}},{"before":"1cc9d069bbc99a7f91e9c778ad777d2dc134b0b2","after":"a98e0a57d83b37d7a7e124ac55e4ad55934df535","ref":"refs/heads/master","pushedAt":"2024-02-19T20:43:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"create exercise to rewrite minbpe for learners","shortMessageHtmlLink":"create exercise to rewrite minbpe for learners"}},{"before":"872c086335b2766487b8f9922ff6965a19de5f29","after":"1cc9d069bbc99a7f91e9c778ad777d2dc134b0b2","ref":"refs/heads/master","pushedAt":"2024-02-19T18:07:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"add small amount of code to write out the gpt4 vocab in the same format as the base class, taking into account the byte shuffle","shortMessageHtmlLink":"add small amount of code to write out the gpt4 vocab in the same form…"}},{"before":"f7122fe1695c8fb92f004b029029cd98827f12b8","after":"872c086335b2766487b8f9922ff6965a19de5f29","ref":"refs/heads/master","pushedAt":"2024-02-19T17:47:21.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #18 from ahmedivy/master\n\nAdd requirements.txt","shortMessageHtmlLink":"Merge pull request #18 from ahmedivy/master"}},{"before":"aac75c8e35be097ee79455098948ceef97aa8ac1","after":"f7122fe1695c8fb92f004b029029cd98827f12b8","ref":"refs/heads/master","pushedAt":"2024-02-19T17:45:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"add link to another relevant issue here","shortMessageHtmlLink":"add link to another relevant issue here"}},{"before":"ade909f8af2e9534ea3d2f37f68e96e9703ebcac","after":"aac75c8e35be097ee79455098948ceef97aa8ac1","ref":"refs/heads/master","pushedAt":"2024-02-19T16:15:00.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #17 from eltociear/patch-1\n\nUpdate regex.py","shortMessageHtmlLink":"Merge pull request #17 from eltociear/patch-1"}},{"before":"4ccf644f552943a1868d816766bb0fdd8900bc73","after":"ade909f8af2e9534ea3d2f37f68e96e9703ebcac","ref":"refs/heads/master","pushedAt":"2024-02-19T16:13:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"change the handling of special tokens inside encode of RegexTokenizer, make the default behavior consistent with tiktoken, i.e. the person has to explicitly declare intent to use or not use special tokens in encoding, if they are present","shortMessageHtmlLink":"change the handling of special tokens inside encode of RegexTokenizer…"}},{"before":"37b63c28f77f9d01a2e86a55b8ac99826265a889","after":"4ccf644f552943a1868d816766bb0fdd8900bc73","ref":"refs/heads/master","pushedAt":"2024-02-19T15:52:39.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"refactor the readme file and adjust the API on how special tokens are handled","shortMessageHtmlLink":"refactor the readme file and adjust the API on how special tokens are…"}},{"before":"e82c123ca452a3c8698a26f8e0b37e5c898799e7","after":"37b63c28f77f9d01a2e86a55b8ac99826265a889","ref":"refs/heads/master","pushedAt":"2024-02-19T14:54:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"fix pytest -v, it was printing all of taylor swift text","shortMessageHtmlLink":"fix pytest -v, it was printing all of taylor swift text"}},{"before":"e0ed1bc84ec495e493482aea23eff382a0262c33","after":"e82c123ca452a3c8698a26f8e0b37e5c898799e7","ref":"refs/heads/master","pushedAt":"2024-02-19T14:45:39.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"meaty change: adding special tokens handling, so now we have full parity with the GPT-4 Tokenizer","shortMessageHtmlLink":"meaty change: adding special tokens handling, so now we have full par…"}},{"before":"9ab2500a6733ce5336b493f2c00055c85de25138","after":"e0ed1bc84ec495e493482aea23eff382a0262c33","ref":"refs/heads/master","pushedAt":"2024-02-18T16:11:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"add small warnings about gpt4 tokenizer just being a pretrained tokenizer","shortMessageHtmlLink":"add small warnings about gpt4 tokenizer just being a pretrained token…"}},{"before":"7843c9627b34eb15c67799b335cd6017c13e8aeb","after":"9ab2500a6733ce5336b493f2c00055c85de25138","ref":"refs/heads/master","pushedAt":"2024-02-18T15:50:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"maintain todos","shortMessageHtmlLink":"maintain todos"}},{"before":"ff20c9205ba4621a2a1b725130b557ace9c400de","after":"7843c9627b34eb15c67799b335cd6017c13e8aeb","ref":"refs/heads/master","pushedAt":"2024-02-18T15:27:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"optimization: allow get_stats to update an existing counts dict. train.py runtime goes from 32s to 22s doing this. ty @gklab for original suggestion in a PR","shortMessageHtmlLink":"optimization: allow get_stats to update an existing counts dict. trai…"}},{"before":"b52bf9b3943ad0f1511e40aacaa9838ae5446a12","after":"ff20c9205ba4621a2a1b725130b557ace9c400de","ref":"refs/heads/master","pushedAt":"2024-02-18T15:15:35.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #13 from gklab/spelling_error\n\nAdjust comments & block commit of the models folder","shortMessageHtmlLink":"Merge pull request #13 from gklab/spelling_error"}},{"before":"a0a05f80f7e2e5cf5f5ecb6abb653acd9c821f64","after":"b52bf9b3943ad0f1511e40aacaa9838ae5446a12","ref":"refs/heads/master","pushedAt":"2024-02-18T15:13:24.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"decompose long line here","shortMessageHtmlLink":"decompose long line here"}},{"before":"f9e19ea00d51f7d449d0cf90a5529ade6081ac04","after":"a0a05f80f7e2e5cf5f5ecb6abb653acd9c821f64","ref":"refs/heads/master","pushedAt":"2024-02-18T02:17:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"gitignore add","shortMessageHtmlLink":"gitignore add"}},{"before":"a04b85accaf34190fdc5d2f966923fde3edd2fa0","after":"f9e19ea00d51f7d449d0cf90a5529ade6081ac04","ref":"refs/heads/master","pushedAt":"2024-02-18T02:16:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"add caution around save/load of gpt4 tokenizer","shortMessageHtmlLink":"add caution around save/load of gpt4 tokenizer"}},{"before":"ac3ca85205bbf882ce5d7fc59935f5f9ed51103e","after":"a04b85accaf34190fdc5d2f966923fde3edd2fa0","ref":"refs/heads/master","pushedAt":"2024-02-18T01:14:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"let's not clutter the main directory","shortMessageHtmlLink":"let's not clutter the main directory"}},{"before":"d278867d2ae0a408a28df4d2b717f47d26017661","after":"ac3ca85205bbf882ce5d7fc59935f5f9ed51103e","ref":"refs/heads/master","pushedAt":"2024-02-18T01:02:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"major refactor to make this a sensible package with nice tests etc. we almost look legitimate now","shortMessageHtmlLink":"major refactor to make this a sensible package with nice tests etc. w…"}},{"before":"3e684139cbcc46df590791ae3dd91d611f4051ac","after":"d278867d2ae0a408a28df4d2b717f47d26017661","ref":"refs/heads/master","pushedAt":"2024-02-18T00:37:52.000Z","pushType":"push","commitsCount":5,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge branch 'ViswanathaReddyGajjala-master'","shortMessageHtmlLink":"Merge branch 'ViswanathaReddyGajjala-master'"}},{"before":"2c521cba8b598a7af22931da9f632c3fa0773ed1","after":"3e684139cbcc46df590791ae3dd91d611f4051ac","ref":"refs/heads/master","pushedAt":"2024-02-17T17:20:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"remove educational as constraint. i think we might be able to make this repo have teeth and have some more optimized versions. but we'd keep the simple reference code","shortMessageHtmlLink":"remove educational as constraint. i think we might be able to make th…"}},{"before":"02e9e20b2500ac9e8910902b79b3830aa0556e23","after":"2c521cba8b598a7af22931da9f632c3fa0773ed1","ref":"refs/heads/master","pushedAt":"2024-02-17T17:18:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"major changes and refactoring, creating base class, joining the utility functions, and adding the save/load functionality in the base class","shortMessageHtmlLink":"major changes and refactoring, creating base class, joining the utili…"}},{"before":"cc7fb340d82031eef1ae2a1706256f570830e1e6","after":"02e9e20b2500ac9e8910902b79b3830aa0556e23","ref":"refs/heads/master","pushedAt":"2024-02-17T01:20:41.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #1 from cyrilzakka/master\n\nFixes imports in train.py","shortMessageHtmlLink":"Merge pull request #1 from cyrilzakka/master"}},{"before":"43ffc2f4410a53a34b950e47fa7b42cec6101108","after":"cc7fb340d82031eef1ae2a1706256f570830e1e6","ref":"refs/heads/master","pushedAt":"2024-02-17T00:01:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"mild improve docs","shortMessageHtmlLink":"mild improve docs"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEN3oUiwA","startCursor":null,"endCursor":null}},"title":"Activity · karpathy/minbpe"}