/
786edd87-476e-42a6-bcc0-521833ec73e5.json
137 lines (137 loc) · 3.72 KB
/
786edd87-476e-42a6-bcc0-521833ec73e5.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
{
"schema_version": "0.2.3",
"record_metadata": {
"uuid": "786edd87-476e-42a6-bcc0-521833ec73e5",
"record_created_on": "2022-09-08",
"record_created_by": "Kudela, Xenia Monika",
"last_edited_on": ""
},
"project": {
"title": "Open Islamicate Texts Initiative Arabic-script OCR Catalyst Project",
"abbr": "OpenITI AOCP",
"type": "project",
"ref": [],
"date": [
{
"from": "2019-09",
"to": "2021-12"
}
],
"maintained": null,
"websites": [
"https://openiti.org/projects/OpenITI%20AOCP%20Phase%20One.html",
"https://mith.umd.edu/research/openiti-aocp/"
],
"project_desc": "This project is led by an interdisciplinary team of humanities, computer science, and digital humanities co-principal investigators with the scope to challenge the technical and organizational barriers that historically have stymied the development of Arabic-script OCR and digital text production for Islamicate Studies. Its primary goal is to achieve approximately 97% character accuracy rates (CARs) for OCR on the most used Persian and Arabic print typefaces.",
"places": [
{
"place_name": {
"text": "College Park",
"ref": ["https://www.geonames.org/4351977/college-park.html"]
},
"coordinates": {
"lat": "38.98067",
"lng": "-76.93692"
}
},
{
"place_name": {
"text": "Leipzig",
"ref": ["https://www.geonames.org/2879139/leipzig.html"]
},
"coordinates": {
"lat": "51.33962",
"lng": "12.37129"
}
},
{
"place_name": {
"text": "London",
"ref": ["https://www.geonames.org/2643743/london.html"]
},
"coordinates": {
"lat": "51.50853",
"lng": "-0.12574"
}
},
{
"place_name": {
"text": "Vienna",
"ref": ["https://www.geonames.org/2761369/vienna.html"]
},
"coordinates": {
"lat": "48.20849",
"lng": "16.37208"
}
}
],
"lang": ["eng"],
"related_institutions": [],
"related_entities": [
{
"relation_type": "parent",
"title": "Open Islamicate Texts Initiative",
"uuid": "bef2e507-b663-422e-9dd3-7e49ca299f05"
},
{
"relation_type": "parent",
"title": "SHARIAsource",
"uuid": "1b2ca0bf-fb29-4b5c-852b-2eedd6a85773"
},
{
"relation_type": "sibling",
"title": "Automatic Collation for Diversifying Corpora",
"uuid": "5e7ab61a-0c33-44fc-8175-a1930e6d08bc"
},
{
"relation_type": "sibling",
"title": "CorpusBuilder",
"uuid": "eb1591d7-75b9-4d62-9f67-0679e627587b"
}
],
"contacts": [
{
"pers_name": {
"text": "Allen, Jonathan",
"ref": []
},
"roles": ["investigation"],
"websites": ["https://sllc.umd.edu/directory/jonathan-allen"]
}
],
"research_data": {
"lang": ["ara", "fas", "tur", "urd"],
"sustainability_plan": null,
"publications": {
"open_access": 0,
"licensing": [""]
},
"data": {
"datatypes": [],
"repositories": []
}
},
"stack": {
"database": ["sql", "xml", "json", "nosql"],
"backend": ["laravel"],
"frontend": ["vue"],
"tools": [],
"languages": ["php", "javascript", "python"]
},
"policies": [
{
"description": "",
"ref": []
}
],
"keywords": [
"corpus_resource",
"islamic_studies",
"machine_learning",
"nlp",
"ocr"
],
"category": "tools_and_analysis",
"comment": ""
}
}