generated from GLAM-Workbench/glam-workbench-template
/
.zenodo.json
41 lines (41 loc) · 2.83 KB
/
.zenodo.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
{
"language": "eng",
"license": "MIT",
"title": "GLAM-Workbench/libraries-tasmania",
"related_identifiers": [
{
"scheme": "url",
"identifier": "https://github.com/GLAM-Workbench/libraries-tasmania/tree/v1.0.0",
"relation": "isDerivedFrom",
"resource_type": "software"
},
{
"scheme": "url",
"identifier": "https://glam-workbench.net/libraries-tasmania/",
"relation": "isDocumentedBy",
"resource_type": "publication-softwaredocumentation"
},
{
"scheme": "url",
"identifier": "https://glam-workbench.net/",
"relation": "isPartOf",
"resource_type": "other"
}
],
"version": "v1.0.0",
"upload_type": "software",
"keywords": [
"digital humanities",
"Jupyter",
"GLAM Workbench"
],
"publication_date": "2022-09-15",
"creators": [
{
"name": "Sherratt, Tim",
"orcid": "0000-0001-7956-4498"
}
],
"access_right": "open",
"description": "<p>Current version: <a href=\"https://github.com/GLAM-Workbench/libraries-tasmania/releases/tag/v1.0.0\">v1.0.0</a></p> <p>Tools and examples for working with data from <a href=\"https://www.libraries.tas.gov.au/\">Libraries Tasmania</a>. For more information see the <a href=\"https://glam-workbench.net/libraries-tasmania/\">Libraries Tasmania</a> section of the GLAM Workbench.</p> <h2 id=\"tasmanian-post-office-directories\">Tasmanian Post Office Directories</h2> <p>The <a href=\"https://stors.tas.gov.au/ILS/SD_ILS-981598\">Tasmanian Post Office Directories from 1890 to 1948</a> have been digitised and made available by Libraries Tasmania for download as PDFs. These notebooks document a workflow that extracts text and images from the PDFs to build a <a href=\"https://glam-workbench.net/tasmanian-post-office-directories/\">searchable database of their contents</a>.</p> <ul> <li>Download and process Tasmanian Post Office Directory PDFs – downloads all 48 PDFs, then extracts images and text from the PDFs using PyMuPDF</li> <li>Upload Tasmanian Post Office Directory images to Amazon s3 for IIIF – converts the images into pyramidal TIFFs using pyvips and then uploads them to an Amazon s3 bucket for delivery via IIIF</li> <li>Extract text from PDF images using Tesseract – uses Tesseract to extract text from the images</li> <li>Add content from the Tasmanian Post Office Directories to an SQLite database – brings everything together in an SQLite database ready for delivery through Datasette</li> </ul> <p>See the <a href=\"https://glam-workbench.github.io/libraries-tasmania/\">GLAM Workbench for more details</a>.</p> <h2 id=\"cite-as\">Cite as</h2> <p>See the GLAM Workbench or <a href=\"https://doi.org/10.5281/zenodo.3521724\">Zenodo</a> for up-to-date citation details.</p> <hr /> <p>This repository is part of the <a href=\"https://glam-workbench.github.io/\">GLAM Workbench</a>.</p>"
}