{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":743505633,"defaultBranch":"dev","name":"dap_job_quality","ownerLogin":"nestauk","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-01-15T11:36:42.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/14215708?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1718626426.0","currentOid":""},"activityList":{"items":[{"before":"a55d5bcfbde777c743ccc8c7dec6f059929d0acd","after":"def33c96a84ac95642bb29f39aeb0daac7f90190","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-18T17:04:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Make parent directories if they do not exist","shortMessageHtmlLink":"Make parent directories if they do not exist"}},{"before":"1cf1670ae8922cd4ad838a8fb6c8403009428caa","after":"a55d5bcfbde777c743ccc8c7dec6f059929d0acd","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-18T16:18:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: create unique identifier from id and index","shortMessageHtmlLink":"WIP: create unique identifier from id and index"}},{"before":"998a176f99aea7ab80f23fee2fd275ea4eec3e55","after":"1cf1670ae8922cd4ad838a8fb6c8403009428caa","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-18T16:14:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Make sure dependencies are loaded","shortMessageHtmlLink":"Make sure dependencies are loaded"}},{"before":"2da7709be89b5f97175b71e29722b75eaf6e146f","after":"998a176f99aea7ab80f23fee2fd275ea4eec3e55","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-18T16:03:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: early years analysis pipeline. Refactor notebook into scripts","shortMessageHtmlLink":"WIP: early years analysis pipeline. Refactor notebook into scripts"}},{"before":"d9466e107d0d76cfdb06631ef449e206d78b79a5","after":"2da7709be89b5f97175b71e29722b75eaf6e146f","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-18T10:14:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: plumbing extraction of JQ sentences and ngrams","shortMessageHtmlLink":"WIP: plumbing extraction of JQ sentences and ngrams"}},{"before":"6204b892d07983ce7fff3ece1bfcfce6e8815198","after":null,"ref":"refs/heads/53-jq-link-ey-descriptions","pushedAt":"2024-06-17T12:13:46.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"}},{"before":"8cd8891e8338edfc80491763cbcd02b7323070cd","after":"d9466e107d0d76cfdb06631ef449e206d78b79a5","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-17T08:56:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: small updates","shortMessageHtmlLink":"WIP: small updates"}},{"before":"2eb73b17e7b9e9fc4715a40f8fd07c36909cd7c8","after":"8cd8891e8338edfc80491763cbcd02b7323070cd","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-17T08:49:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: save models","shortMessageHtmlLink":"WIP: save models"}},{"before":"8a7ad33a6af2dcbb044f92b5a52fe261ed21437f","after":"2eb73b17e7b9e9fc4715a40f8fd07c36909cd7c8","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-17T08:25:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: updating file structure","shortMessageHtmlLink":"WIP: updating file structure"}},{"before":"ba93f16d36c48dc5aaab695aff9201028cac7353","after":"8a7ad33a6af2dcbb044f92b5a52fe261ed21437f","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-17T08:19:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: small changes to make the code work on ec2","shortMessageHtmlLink":"WIP: small changes to make the code work on ec2"}},{"before":"fbb4ad9d7320928312ca6b3dc54aeb411c53d775","after":"ba93f16d36c48dc5aaab695aff9201028cac7353","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-17T08:02:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: getting JQ sentences from retail and EYP sample","shortMessageHtmlLink":"WIP: getting JQ sentences from retail and EYP sample"}},{"before":"a31b2533d15e5a29f61838c16da6342455badd32","after":"fbb4ad9d7320928312ca6b3dc54aeb411c53d775","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-13T17:02:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Tweak logistic regression code to work on aws","shortMessageHtmlLink":"Tweak logistic regression code to work on aws"}},{"before":"54e3fc4341910eacb444af1b1005b333f037e125","after":"a31b2533d15e5a29f61838c16da6342455badd32","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-13T16:52:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Add logging","shortMessageHtmlLink":"Add logging"}},{"before":"3f35118e9defbf9d4bd586d731996e5a26b50fd9","after":null,"ref":"refs/heads/clean-ey-datasets","pushedAt":"2024-06-13T16:43:32.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"lizgzil","name":"Liz G","path":"/lizgzil","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15956065?s=80&v=4"}},{"before":"fdeb656674dee2f3515f9d45989593edddbf5d9e","after":"546277e14742344909fb06b3d4a9cb3fa77fd468","ref":"refs/heads/dev","pushedAt":"2024-06-13T16:43:29.000Z","pushType":"pr_merge","commitsCount":4,"pusher":{"login":"lizgzil","name":"Liz G","path":"/lizgzil","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15956065?s=80&v=4"},"commit":{"message":"Merge pull request #54 from nestauk/clean-ey-datasets\n\nAdd cleaned descriptions to EY and similar occ datasets","shortMessageHtmlLink":"Merge pull request #54 from nestauk/clean-ey-datasets"}},{"before":"3eb72c6d520b8e7ddfa6ffaf6ddfa4cbc1da0c59","after":"3f35118e9defbf9d4bd586d731996e5a26b50fd9","ref":"refs/heads/clean-ey-datasets","pushedAt":"2024-06-13T16:43:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lizgzil","name":"Liz G","path":"/lizgzil","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15956065?s=80&v=4"},"commit":{"message":"Add mock pipeline","shortMessageHtmlLink":"Add mock pipeline"}},{"before":"d3ff0e6d4bd5730527ffa03a74b56bad63c447f8","after":"54e3fc4341910eacb444af1b1005b333f037e125","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-13T16:36:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP","shortMessageHtmlLink":"WIP"}},{"before":"7c98e81ef631c13785f4e8b9af6947822f772059","after":null,"ref":"refs/heads/50-chunk-sentences","pushedAt":"2024-06-13T16:04:12.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"}},{"before":"6204b892d07983ce7fff3ece1bfcfce6e8815198","after":"fdeb656674dee2f3515f9d45989593edddbf5d9e","ref":"refs/heads/dev","pushedAt":"2024-06-13T16:04:09.000Z","pushType":"pr_merge","commitsCount":4,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Merge pull request #51 from nestauk/50-chunk-sentences\n\nInvestigate rule-based splitting of sentences","shortMessageHtmlLink":"Merge pull request #51 from nestauk/50-chunk-sentences"}},{"before":"83f318d31fd7d68dfdd05308ccd9b91043699fd1","after":"3eb72c6d520b8e7ddfa6ffaf6ddfa4cbc1da0c59","ref":"refs/heads/clean-ey-datasets","pushedAt":"2024-06-13T14:12:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lizgzil","name":"Liz G","path":"/lizgzil","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15956065?s=80&v=4"},"commit":{"message":"revert to previous replacements and add Rosie's change too","shortMessageHtmlLink":"revert to previous replacements and add Rosie's change too"}},{"before":null,"after":"83f318d31fd7d68dfdd05308ccd9b91043699fd1","ref":"refs/heads/clean-ey-datasets","pushedAt":"2024-06-13T14:06:33.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"lizgzil","name":"Liz G","path":"/lizgzil","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15956065?s=80&v=4"},"commit":{"message":"Add new cleaning functions and script to add cleaned descriptions to EY job ads and similar occupations","shortMessageHtmlLink":"Add new cleaning functions and script to add cleaned descriptions to …"}},{"before":"52b8d2f76599e73b483e0309fd4f9de2efcd94da","after":"d3ff0e6d4bd5730527ffa03a74b56bad63c447f8","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-13T14:03:35.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Add script for calculating most common ngrams","shortMessageHtmlLink":"Add script for calculating most common ngrams"}},{"before":"6204b892d07983ce7fff3ece1bfcfce6e8815198","after":"52b8d2f76599e73b483e0309fd4f9de2efcd94da","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-13T12:56:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"WIP: update prodigy utils for handling new labelled data","shortMessageHtmlLink":"WIP: update prodigy utils for handling new labelled data"}},{"before":null,"after":"6204b892d07983ce7fff3ece1bfcfce6e8815198","ref":"refs/heads/53-jq-link-ey-descriptions","pushedAt":"2024-06-13T12:55:58.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences\n\nTrain model on sentences; add random state to PCA","shortMessageHtmlLink":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences"}},{"before":"393c5b6d9a8c54b66c08b668ec7fbc561123e9fc","after":"524d43623496225ca125d72dea50674ff5ae02bd","ref":"refs/heads/29_test_category_mapping_techniques","pushedAt":"2024-06-13T06:38:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Update labelled_data.py\n\nCorrect file name","shortMessageHtmlLink":"Update labelled_data.py"}},{"before":null,"after":"6204b892d07983ce7fff3ece1bfcfce6e8815198","ref":"refs/heads/52-ngrams","pushedAt":"2024-06-12T18:17:34.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences\n\nTrain model on sentences; add random state to PCA","shortMessageHtmlLink":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences"}},{"before":"5d1068b3868a31fc7507146f28910951531883e8","after":"7c98e81ef631c13785f4e8b9af6947822f772059","ref":"refs/heads/50-chunk-sentences","pushedAt":"2024-06-11T09:22:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Refactor chunking approach slightly; improve text cleaning","shortMessageHtmlLink":"Refactor chunking approach slightly; improve text cleaning"}},{"before":"56e97a908a487855fa1c6cbc5b44ff8a515bf497","after":"5d1068b3868a31fc7507146f28910951531883e8","ref":"refs/heads/50-chunk-sentences","pushedAt":"2024-06-11T07:35:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Try out rule-based sentence splitting","shortMessageHtmlLink":"Try out rule-based sentence splitting"}},{"before":"6204b892d07983ce7fff3ece1bfcfce6e8815198","after":"56e97a908a487855fa1c6cbc5b44ff8a515bf497","ref":"refs/heads/50-chunk-sentences","pushedAt":"2024-06-10T16:14:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Investigate rule-based splitting of sentences","shortMessageHtmlLink":"Investigate rule-based splitting of sentences"}},{"before":null,"after":"6204b892d07983ce7fff3ece1bfcfce6e8815198","ref":"refs/heads/50-chunk-sentences","pushedAt":"2024-06-10T16:13:04.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"RFOxbury","name":"Rosie Oxbury","path":"/RFOxbury","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/49554920?s=80&v=4"},"commit":{"message":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences\n\nTrain model on sentences; add random state to PCA","shortMessageHtmlLink":"Merge pull request #43 from nestauk/42-hotfix-classify-sentences"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEaLcU7QA","startCursor":null,"endCursor":null}},"title":"Activity · nestauk/dap_job_quality"}