{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"labelpropagation_clothing","owner":"ONSBigData","isFork":false,"description":"Code to accompany the Data and Policy and Ottawa group paper","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":2,"issueCount":0,"starsCount":2,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-06T21:42:24.050Z"}},{"type":"Public","name":"drift_detection_model_retraining","owner":"ONSBigData","isFork":false,"description":"Drift detection and model retraining methods","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-11-28T14:03:21.986Z"}},{"type":"Public","name":"scikit-learn-imputer","owner":"ONSBigData","isFork":false,"description":"Imputation tool for categorical and continuous data using scikit-learn algorithms. Includes simulation study and model persistence.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-06-22T14:12:08.139Z"}},{"type":"Public","name":"ONSBigData.github.io","owner":"ONSBigData","isFork":false,"description":"The ONS Big Data Team Github pages","allTopics":["data-science","statistics","big-data","ons","office-for-national-statistics","official-statistics","github-page"],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":1,"issueCount":0,"starsCount":10,"forksCount":2,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-05-19T01:33:41.834Z"}},{"type":"Public","name":"precon","owner":"ONSBigData","isFork":false,"description":"Functions for price index economics.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":5,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-03-30T10:59:58.581Z"}},{"type":"Public","name":"housing-websites","owner":"ONSBigData","isFork":false,"description":"Collect data from Zoopla then use machine learning to identify caravans","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":16,"forksCount":6,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-10-01T12:57:46.933Z"}},{"type":"Public","name":"synthetic4linkage","owner":"ONSBigData","isFork":false,"description":"Creating synthetic data for testing clerical linkage interface","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":2,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-05-21T08:25:32.505Z"}},{"type":"Public","name":"companies_house_ocr_runner","owner":"ONSBigData","isFork":false,"description":"Runs Tesseract OCR over PDF paper filings from Companies House.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":4,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-01-06T17:50:27.304Z"}},{"type":"Public","name":"companies_house_filing_fetcher","owner":"ONSBigData","isFork":false,"description":"Downloads paper filings from the Companies House API","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":3,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-01-06T16:35:28.640Z"}},{"type":"Public","name":"dcm-transcripts-new","owner":"ONSBigData","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-12-02T11:00:05.347Z"}},{"type":"Public","name":"scala_udf_example","owner":"ONSBigData","isFork":false,"description":"Using Scala to create a Spark UDF designed to be callable from PySpark.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-11-13T10:53:13.290Z"}},{"type":"Public","name":"exploring_companies_house","owner":"ONSBigData","isFork":false,"description":"exploring and data checking companies house data read from pdfs","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-08-08T10:57:38.646Z"}},{"type":"Public","name":"zip_to_sequence_file","owner":"ONSBigData","isFork":false,"description":"Command line utility to convert zip archives into Hadoop Sequence Files","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-04-21T09:11:25.208Z"}},{"type":"Public","name":"parsing_company_accounts","owner":"ONSBigData","isFork":false,"description":"Reading digital XBRL/iXBRL account documents - for sharing","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":2,"starsCount":43,"forksCount":17,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-02-28T16:02:51.960Z"}},{"type":"Public","name":"traffic_as_early_indicator","owner":"ONSBigData","isFork":false,"description":"Files for a brief report investigating if traffic flow (Annual average daily flow) could be used as an early indicator for GDP","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-01-07T11:28:26.740Z"}},{"type":"Public","name":"textanalysisGUI","owner":"ONSBigData","isFork":false,"description":"Python web GUI for text analysis purposes. ","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-11-21T21:39:13.681Z"}},{"type":"Public","name":"pycon-uk-2018","owner":"ONSBigData","isFork":false,"description":"feedback from PyCon UK 2018","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-10-15T14:10:02.408Z"}},{"type":"Public","name":"rise-presentation","owner":"ONSBigData","isFork":false,"description":"Small self-contained RISE presentation example","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-10-05T11:09:00.847Z"}},{"type":"Public","name":"spark_udf_benchmark_example","owner":"ONSBigData","isFork":false,"description":"Timed runs of Scala and Python UDFs in Spark (on a Virtual Machine). ","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-09-20T12:18:35.709Z"}},{"type":"Public","name":"RSS-2018","owner":"ONSBigData","isFork":false,"description":"Traffic flow as an early indicator for GDP ","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-09-12T16:12:48.546Z"}},{"type":"Public","name":"revealjs-demo","owner":"ONSBigData","isFork":false,"description":"reveal.js demo slides","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-07-27T15:08:58.627Z"}},{"type":"Public","name":"dsc-lunch","owner":"ONSBigData","isFork":false,"description":"slides for dsc lunch","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-07-16T17:22:58.778Z"}},{"type":"Public","name":"bristol_data_dive","owner":"ONSBigData","isFork":false,"description":"Repo for work from the Bristol data dive: http://www.data4sdgs.org/news/bristol-data-dive","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-04-24T09:47:30.972Z"}},{"type":"Public","name":"housing_clf","owner":"ONSBigData","isFork":false,"description":"Classification of restricted access properties and caravans within Zoopla Data","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-04-18T13:50:04.176Z"}},{"type":"Public","name":"Scraping-demo","owner":"ONSBigData","isFork":false,"description":"Web scraping demo files","allTopics":["demo","webscraping"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-03-13T09:39:28.468Z"}},{"type":"Public","name":"Clustering_paper","owner":"ONSBigData","isFork":false,"description":"Working paper and notebook for unsupervised document clustering","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":5,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-03-06T14:18:07.070Z"}},{"type":"Public","name":"ESSnet-WP7-UK-Case-Study","owner":"ONSBigData","isFork":false,"description":"Explore how we might produce statistics on social sentiment from news/social media towards events/topics and how those can be linked to existing official statistics which annually measure population well-being","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-12-04T13:11:44.267Z"}},{"type":"Public","name":"ExtracTED","owner":"ONSBigData","isFork":false,"description":"Scripts to extract and parse TED (Tenders Electronic Daily: http://ted.europa.eu/TED/main/HomePage.do) documents.","allTopics":["python","open-source","tenders","open-data","xml-parser"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":15,"forksCount":8,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-12-01T16:24:55.876Z"}},{"type":"Public","name":"OpencellID-analysis","owner":"ONSBigData","isFork":false,"description":"Comparing densities of mobile cell towers with population estimates","allTopics":[],"primaryLanguage":{"name":"R","color":"#198CE7"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":6,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-10-17T15:48:37.406Z"}},{"type":"Public","name":"LCF-project","owner":"ONSBigData","isFork":false,"description":"Repository for the Big Data Team work on the LCF Project","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-09-21T10:37:25.895Z"}}],"repositoryCount":37,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}