{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":777121135,"defaultBranch":"main","name":"LLMTrainingOnJeanZay","ownerLogin":"OpenLLM-France","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-03-25T08:40:53.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/136799956?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1711960412.0","currentOid":""},"activityList":{"items":[{"before":"74e53b94d7081e74637daaab86c227c0812249af","after":"71fb9e4f342558b52f350fad205a1d6e4df3e9e3","ref":"refs/heads/main","pushedAt":"2024-04-20T05:15:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok pour lire le corpus en random avec des seek, mais le corpus n'a pas l'air top, allemand, espagnol, bcp de fautes d OCR, FR trop ancien, des series de chiffres","shortMessageHtmlLink":"ok pour lire le corpus en random avec des seek, mais le corpus n'a pa…"}},{"before":"be88ac1d357443ee39866160e37137df8d050a68","after":"74e53b94d7081e74637daaab86c227c0812249af","ref":"refs/heads/main","pushedAt":"2024-04-20T04:50:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"pickle too slow","shortMessageHtmlLink":"pickle too slow"}},{"before":"e25e9b49022b8867c55946756cddeb5b3cd0f255","after":"be88ac1d357443ee39866160e37137df8d050a68","ref":"refs/heads/main","pushedAt":"2024-04-19T07:59:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"seek seems OK","shortMessageHtmlLink":"seek seems OK"}},{"before":"1d654f0e613a240834b5c3daf8702dad53c02789","after":"e25e9b49022b8867c55946756cddeb5b3cd0f255","ref":"refs/heads/main","pushedAt":"2024-04-19T05:20:54.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"09dd4cd562f6e6a6e8ec0ce271cc6916513f6b85","after":"1d654f0e613a240834b5c3daf8702dad53c02789","ref":"refs/heads/main","pushedAt":"2024-04-19T05:19:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"11 jours pour tout tokenizer","shortMessageHtmlLink":"11 jours pour tout tokenizer"}},{"before":"60103cae2dc85d26d9b6f8e551e39e3672be24cd","after":"09dd4cd562f6e6a6e8ec0ce271cc6916513f6b85","ref":"refs/heads/main","pushedAt":"2024-04-18T19:24:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"TODO: try with datasets multithread loader","shortMessageHtmlLink":"TODO: try with datasets multithread loader"}},{"before":"de90b22ed99a3355dbd53847d860d9e176b0dc52","after":"60103cae2dc85d26d9b6f8e551e39e3672be24cd","ref":"refs/heads/main","pushedAt":"2024-04-18T19:05:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"pb tokenizer trop lent","shortMessageHtmlLink":"pb tokenizer trop lent"}},{"before":"f08ceb2a92ce7c7101a9812824963dff34674f2f","after":"de90b22ed99a3355dbd53847d860d9e176b0dc52","ref":"refs/heads/main","pushedAt":"2024-04-18T16:31:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"519063e9c821f76cf710c8a689781c3fa560c178","after":"f08ceb2a92ce7c7101a9812824963dff34674f2f","ref":"refs/heads/main","pushedAt":"2024-04-18T16:09:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"d3e5d0e10e30602fe949b6ceda2ef4716217d974","after":"519063e9c821f76cf710c8a689781c3fa560c178","ref":"refs/heads/main","pushedAt":"2024-04-18T07:20:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"452d3292ebc725a671940c03968d34ff49c5068e","after":"d3e5d0e10e30602fe949b6ceda2ef4716217d974","ref":"refs/heads/main","pushedAt":"2024-04-18T05:17:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"trop lent","shortMessageHtmlLink":"trop lent"}},{"before":"ea78f1f5acfe0d0a18c4ed19501228797a31d84b","after":"452d3292ebc725a671940c03968d34ff49c5068e","ref":"refs/heads/main","pushedAt":"2024-04-17T18:59:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"TODO: relaunch fullcorpus2 to process all data; check dsbloom for seek() time","shortMessageHtmlLink":"TODO: relaunch fullcorpus2 to process all data; check dsbloom for see…"}},{"before":"bb1efedebc3d8a0250fd9737c97c230558b2962e","after":"ea78f1f5acfe0d0a18c4ed19501228797a31d84b","ref":"refs/heads/main","pushedAt":"2024-04-12T06:55:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"9a6273235d6c1d4e341a0f9e27743d26f9a1737b","after":"bb1efedebc3d8a0250fd9737c97c230558b2962e","ref":"refs/heads/main","pushedAt":"2024-04-11T18:56:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"6557d0094c8f9e7b65b6bea02f026fc3a36997fe","after":"9a6273235d6c1d4e341a0f9e27743d26f9a1737b","ref":"refs/heads/main","pushedAt":"2024-04-11T18:00:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"d40965cef2f37304d7caed21be4a3bce92f8f43b","after":"6557d0094c8f9e7b65b6bea02f026fc3a36997fe","ref":"refs/heads/main","pushedAt":"2024-04-11T17:20:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"e846441dfc950e416de1bc95ae3348f8febf21a3","after":"d40965cef2f37304d7caed21be4a3bce92f8f43b","ref":"refs/heads/main","pushedAt":"2024-04-11T17:08:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"da5ed6f6d5b76834647d00e91b9ca2013fe292fc","after":"e846441dfc950e416de1bc95ae3348f8febf21a3","ref":"refs/heads/main","pushedAt":"2024-04-10T18:27:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"a4318b9e160d58578cb7a43bea21a48645f161fd","after":"da5ed6f6d5b76834647d00e91b9ca2013fe292fc","ref":"refs/heads/main","pushedAt":"2024-04-10T17:57:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"trying continual learning from bloom7b on Lucie training corpus","shortMessageHtmlLink":"trying continual learning from bloom7b on Lucie training corpus"}},{"before":"e37925a75ab0cf5591e812f7325ad012e81e60a1","after":"a4318b9e160d58578cb7a43bea21a48645f161fd","ref":"refs/heads/main","pushedAt":"2024-04-10T13:12:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"600fb97da160c2ca2f335de94e74812fa5ecd50d","after":"e37925a75ab0cf5591e812f7325ad012e81e60a1","ref":"refs/heads/main","pushedAt":"2024-04-10T05:59:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"8a084b5b3bfcc18017fb555d056066adf00ae4fc","after":"600fb97da160c2ca2f335de94e74812fa5ecd50d","ref":"refs/heads/main","pushedAt":"2024-04-09T16:53:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"un 2eme fichier de croissan_aligned qui ne se lit pas bien","shortMessageHtmlLink":"un 2eme fichier de croissan_aligned qui ne se lit pas bien"}},{"before":"1c687468bc52f7dd6cabb62ae646249230b298b3","after":"8a084b5b3bfcc18017fb555d056066adf00ae4fc","ref":"refs/heads/main","pushedAt":"2024-04-09T12:21:58.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"Merge branch 'main' of github.com:OpenLLM-France/LLMTrainingOnJeanZay into main","shortMessageHtmlLink":"Merge branch 'main' of github.com:OpenLLM-France/LLMTrainingOnJeanZay…"}},{"before":"b5f4c627083164336272053c0276f4b9c2540333","after":"1c687468bc52f7dd6cabb62ae646249230b298b3","ref":"refs/heads/main","pushedAt":"2024-04-08T19:23:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"f3282072d50ab1f4142fe79ca13e3c9efa1fd2db","after":"b5f4c627083164336272053c0276f4b9c2540333","ref":"refs/heads/main","pushedAt":"2024-04-08T14:25:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"try single file to evaluate seek()","shortMessageHtmlLink":"try single file to evaluate seek()"}},{"before":"b51e56631cba1470f1a10683d8dd93efb7baaf4f","after":"f3282072d50ab1f4142fe79ca13e3c9efa1fd2db","ref":"refs/heads/main","pushedAt":"2024-04-08T12:59:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"6116ff778dd360bcf775ba4af5a3939deb14e520","after":"b51e56631cba1470f1a10683d8dd93efb7baaf4f","ref":"refs/heads/main","pushedAt":"2024-04-08T12:57:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"1e1c070a48410e8f4050e324abd9dd841c33c914","after":"6116ff778dd360bcf775ba4af5a3939deb14e520","ref":"refs/heads/main","pushedAt":"2024-04-08T12:08:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"ok","shortMessageHtmlLink":"ok"}},{"before":"bd371e7708008ca9302b49ba96adb295eb2a152f","after":"1e1c070a48410e8f4050e324abd9dd841c33c914","ref":"refs/heads/main","pushedAt":"2024-04-06T19:33:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"try with basic python seek()","shortMessageHtmlLink":"try with basic python seek()"}},{"before":"9f82becdcf567bcb954462c148c0e64555baded1","after":"bd371e7708008ca9302b49ba96adb295eb2a152f","ref":"refs/heads/main","pushedAt":"2024-04-02T19:22:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"cerisara","name":"Christophe Cerisara","path":"/cerisara","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/520973?s=80&v=4"},"commit":{"message":"converts .parquet files into pyarrow format for random access","shortMessageHtmlLink":"converts .parquet files into pyarrow format for random access"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAENbHNEgA","startCursor":null,"endCursor":null}},"title":"Activity · OpenLLM-France/LLMTrainingOnJeanZay"}