From a7041857ff59ba2ef1f1bdb33303364c0a24c9ea Mon Sep 17 00:00:00 2001 From: Eric Herman Date: Thu, 22 Jul 2021 10:50:58 +0200 Subject: [PATCH 1/5] Add DPG: tico-19 (translation initiative for covid 19, Issue #555) --- ...ion-initiative-for-covid-19-(tico-19).json | 98 +++++++++++++++++++ 1 file changed, 98 insertions(+) create mode 100644 digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json diff --git a/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json b/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json new file mode 100644 index 000000000..142463c44 --- /dev/null +++ b/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json @@ -0,0 +1,98 @@ +{ + "name": "Translation Initiative for Covid-19 (TICO-19)", + "clearOwnership": { + "isOwnershipExplicit": "Yes", + "copyrightURL": "https://tico-19.github.io/" + }, + "platformIndependence": { + "mandatoryDepsCreateMoreRestrictions": "No", + "isSoftwarePltIndependent": "", + "pltIndependenceDesc": "" + }, + "documentation": { + "isDocumentationAvailable": "Yes", + "documentationURL": [ + "https://tico-19.github.io/index.html" + ] + }, + "NonPII": { + "collectsNonPII": "No", + "checkNonPIIAccessMechanism": "", + "nonPIIAccessMechanism": "" + }, + "privacy": { + "isPrivacyCompliant": "Yes", + "privacyComplianceList": [ + "" + ], + "adherenceSteps": [ + "" + ] + }, + "standards": { + "supportStandards": "Yes", + "standardsList": [ + "The data collection followed established industry standards for fair compensation. The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows industry standards." + ], + "evidenceStandardSupport": [ + "" + ], + "implementBestPractices": "Yes", + "bestPracticesList": [ + "See answer above. The data collection followed established industry standards for fair compensation. 
The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows higher-quality translation industry standards." + ] + }, + "doNoHarm": { + "preventHarm": { + "stepsToPreventHarm": "Yes", + "additionalInfoMechanismProcessesPolicies": "Yes. A major potential from harm relating to COVID-19 is the spread of misinformation. As such, the team made sure that all originally selected documents came from trusted sources and did not include unsubstantiated claims.\nAnother potential harm could result from potential mistranslations of the COVID-19 content, which could inadvertently provide misleading information. Thus, we followed a rigorous quality assurance process involving professional translators with medical expertise, to ensure that the terminologies and translations are as accurate as possible." + }, + "dataPrivacySecurity": { + "collectsPII": "No", + "typesOfDataCollected": [ + "" + ], + "thirdPartyDataSharing": "Unknown", + "dataSharingCircumstances": [ + "" + ], + "ensurePrivacySecurity": "Unknown", + "privacySecurityDescription": "" + }, + "inappropriateIllegalContent": { + "collectStoreDistribute": "Yes", + "type": "Yes, the project created and distributed translations memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages", + "illegalContentDetection": "Yes", + "illegalContentDetectionMechanism": "Yes, the project created and distributed translations memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages: Amharic, Arabic (Modern Standard), Bengali, Chinese (Simplified), Dari, Dinka, Farsi, French (European), Hausa, Hindi, Indonesian, Kanuri, Khmer (Central), Kinyarwanda, Kurdish Kurmanji, Kurdish Sorani, Lingala, Luganda, Malay, Marathi, Myanmar, Nepali, Nigerian Fulfulde, Nuer, 
Oromo, Pashto, Portuguese (Brazilian), Russian, Somali, Spanish (Latin American), Swahili, Congolese Swahili, Tagalog, Tamil, Tigrinya, Urdu, Zulu.\nThese documents were originally selected for their relevance to COVID-19, and they do not contain inappropriate or illegal content." + }, + "protectionFromHarassment": { + "userInteraction": "Yes", + "addressSafetySecurityUnderageUsers": "Yes", + "stepsAddressRiskPreventSafetyUnderageUsers": [ + "Yes, there is a call for community contributions: https://tico-19.github.io/translators.html", + "Professional translators are invited to share their translation memories or terminologies, as well as to use and potentially correct the provided datasets.", + "We also invite translations of the existing data to more languages.", + "", + "We do not anticipate any risk from underage or other users, hence we do not restrict access to anyone." + ], + "griefAbuseHarassmentProtection": "No", + "harassmentProtectionSteps": [ + "" + ] + } + }, + "locations": { + "developmentCountries": [ + "USA", + "Ireland", + "UK", + "Canada", + "Spain", + "Italy", + "Australia" + ], + "deploymentCountries": [ + "Worldwide" + ] + } +} From 992d397eaf4db97e756dcb0b73da807adeb9c7c7 Mon Sep 17 00:00:00 2001 From: nathanbaleeta Date: Thu, 12 Aug 2021 21:27:44 +0300 Subject: [PATCH 2/5] Update name field to match nominee --- .../translation-initiative-for-covid-19.json | 98 +++++++++++++++++++ 1 file changed, 98 insertions(+) create mode 100644 digitalpublicgoods/translation-initiative-for-covid-19.json diff --git a/digitalpublicgoods/translation-initiative-for-covid-19.json b/digitalpublicgoods/translation-initiative-for-covid-19.json new file mode 100644 index 000000000..51fd49205 --- /dev/null +++ b/digitalpublicgoods/translation-initiative-for-covid-19.json @@ -0,0 +1,98 @@ +{ + "name": "Translation Initiative for Covid-19", + "clearOwnership": { + "isOwnershipExplicit": "Yes", + "copyrightURL": "https://tico-19.github.io/" + }, +
"platformIndependence": { + "mandatoryDepsCreateMoreRestrictions": "No", + "isSoftwarePltIndependent": "", + "pltIndependenceDesc": "" + }, + "documentation": { + "isDocumentationAvailable": "Yes", + "documentationURL": [ + "https://tico-19.github.io/index.html" + ] + }, + "NonPII": { + "collectsNonPII": "No", + "checkNonPIIAccessMechanism": "", + "nonPIIAccessMechanism": "" + }, + "privacy": { + "isPrivacyCompliant": "Yes", + "privacyComplianceList": [ + "" + ], + "adherenceSteps": [ + "" + ] + }, + "standards": { + "supportStandards": "Yes", + "standardsList": [ + "The data collection followed established industry standards for fair compensation. The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows industry standards." + ], + "evidenceStandardSupport": [ + "" + ], + "implementBestPractices": "Yes", + "bestPracticesList": [ + "See answer above. The data collection followed established industry standards for fair compensation. The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows higher-quality translation industry standards." + ] + }, + "doNoHarm": { + "preventHarm": { + "stepsToPreventHarm": "Yes", + "additionalInfoMechanismProcessesPolicies": "Yes. A major potential for harm relating to COVID-19 is the spread of misinformation. As such, the team made sure that all originally selected documents came from trusted sources and did not include unsubstantiated claims.\nAnother potential harm could result from potential mistranslations of the COVID-19 content, which could inadvertently provide misleading information. Thus, we followed a rigorous quality assurance process involving professional translators with medical expertise, to ensure that the terminologies and translations are as accurate as possible."
+ }, + "dataPrivacySecurity": { + "collectsPII": "No", + "typesOfDataCollected": [ + "" + ], + "thirdPartyDataSharing": "Unknown", + "dataSharingCircumstances": [ + "" + ], + "ensurePrivacySecurity": "Unknown", + "privacySecurityDescription": "" + }, + "inappropriateIllegalContent": { + "collectStoreDistribute": "Yes", + "type": "Yes, the project created and distributed translation memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages", + "illegalContentDetection": "Yes", + "illegalContentDetectionMechanism": "Yes, the project created and distributed translation memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages: Amharic, Arabic (Modern Standard), Bengali, Chinese (Simplified), Dari, Dinka, Farsi, French (European), Hausa, Hindi, Indonesian, Kanuri, Khmer (Central), Kinyarwanda, Kurdish Kurmanji, Kurdish Sorani, Lingala, Luganda, Malay, Marathi, Myanmar, Nepali, Nigerian Fulfulde, Nuer, Oromo, Pashto, Portuguese (Brazilian), Russian, Somali, Spanish (Latin American), Swahili, Congolese Swahili, Tagalog, Tamil, Tigrinya, Urdu, Zulu.\nThese documents were originally selected for their relevance to COVID-19, and they do not contain inappropriate or illegal content."
+ }, + "protectionFromHarassment": { + "userInteraction": "Yes", + "addressSafetySecurityUnderageUsers": "Yes", + "stepsAddressRiskPreventSafetyUnderageUsers": [ + "Yes, there is a call for community contributions: https://tico-19.github.io/translators.html", + "Professional translators are invited to share their translation memories or terminologies, as well as to use and potentially correct the provided datasets.", + "We also invite translations of the existing data to more languages.", + "", + "We do not anticipate any risk from underage or other users, hence we do not restrict access to anyone." + ], + "griefAbuseHarassmentProtection": "No", + "harassmentProtectionSteps": [ + "" + ] + } + }, + "locations": { + "developmentCountries": [ + "USA", + "Ireland", + "UK", + "Canada", + "Spain", + "Italy", + "Australia" + ], + "deploymentCountries": [ + "" + ] + } +} From 9f58294a407a9c52df5f6558cb8419abea9ab721 Mon Sep 17 00:00:00 2001 From: Nathan Baleeta Date: Thu, 12 Aug 2021 21:31:41 +0300 Subject: [PATCH 3/5] Delete translation-initiative-for-covid-19-(tico-19).json --- ...ion-initiative-for-covid-19-(tico-19).json | 98 ------------------- 1 file changed, 98 deletions(-) delete mode 100644 digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json diff --git a/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json b/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json deleted file mode 100644 index 142463c44..000000000 --- a/digitalpublicgoods/translation-initiative-for-covid-19-(tico-19).json +++ /dev/null @@ -1,98 +0,0 @@ -{ - "name": "Translation Initiative for Covid-19 (TICO-19)", - "clearOwnership": { - "isOwnershipExplicit": "Yes", - "copyrightURL": "https://tico-19.github.io/" - }, - "platformIndependence": { - "mandatoryDepsCreateMoreRestrictions": "No", - "isSoftwarePltIndependent": "", - "pltIndependenceDesc": "" - }, - "documentation": { - "isDocumentationAvailable": "Yes", - "documentationURL": [ - 
"https://tico-19.github.io/index.html" - ] - }, - "NonPII": { - "collectsNonPII": "No", - "checkNonPIIAccessMechanism": "", - "nonPIIAccessMechanism": "" - }, - "privacy": { - "isPrivacyCompliant": "Yes", - "privacyComplianceList": [ - "" - ], - "adherenceSteps": [ - "" - ] - }, - "standards": { - "supportStandards": "Yes", - "standardsList": [ - "The data collection followed established industry standards for fair compensation. The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows industry standards." - ], - "evidenceStandardSupport": [ - "" - ], - "implementBestPractices": "Yes", - "bestPracticesList": [ - "See answer above. The data collection followed established industry standards for fair compensation. The released dataset has also been reviewed through a rigorous quality assurance process, which exceeds the typical academic standards and follows higher-quality translation industry standards." - ] - }, - "doNoHarm": { - "preventHarm": { - "stepsToPreventHarm": "Yes", - "additionalInfoMechanismProcessesPolicies": "Yes. A major potential from harm relating to COVID-19 is the spread of misinformation. As such, the team made sure that all originally selected documents came from trusted sources and did not include unsubstantiated claims.\nAnother potential harm could result from potential mistranslations of the COVID-19 content, which could inadvertently provide misleading information. Thus, we followed a rigorous quality assurance process involving professional translators with medical expertise, to ensure that the terminologies and translations are as accurate as possible." 
- }, - "dataPrivacySecurity": { - "collectsPII": "No", - "typesOfDataCollected": [ - "" - ], - "thirdPartyDataSharing": "Unknown", - "dataSharingCircumstances": [ - "" - ], - "ensurePrivacySecurity": "Unknown", - "privacySecurityDescription": "" - }, - "inappropriateIllegalContent": { - "collectStoreDistribute": "Yes", - "type": "Yes, the project created and distributed translations memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages", - "illegalContentDetection": "Yes", - "illegalContentDetectionMechanism": "Yes, the project created and distributed translations memories, terminologies and a public translation benchmark that includes 30 documents (3071 sentences, 69.7k words) translated from English into 36 languages: Amharic, Arabic (Modern Standard), Bengali, Chinese (Simplified), Dari, Dinka, Farsi, French (European), Hausa, Hindi, Indonesian, Kanuri, Khmer (Central), Kinyarwanda, Kurdish Kurmanji, Kurdish Sorani, Lingala, Luganda, Malay, Marathi, Myanmar, Nepali, Nigerian Fulfulde, Nuer, Oromo, Pashto, Portuguese (Brazilian), Russian, Somali, Spanish (Latin American), Swahili, Congolese Swahili, Tagalog, Tamil, Tigrinya, Urdu, Zulu.\nThese documents were originally selected for their relevance to COVID-19, and they do not contain inappropriate or illegal content." 
- }, - "protectionFromHarassment": { - "userInteraction": "Yes", - "addressSafetySecurityUnderageUsers": "Yes", - "stepsAddressRiskPreventSafetyUnderageUsers": [ - "Yes, there is a call for community contributions: https://tico-19.github.io/translators.html", - "Professional translators are invited to share their translation memories or terminologies, as well as to use and potentially correct the provided datasets.", - "We also invite translations of the existing data to more languages.", - "", - "We do not anticipate any risk from underage or other users, hence we do not restrict access to anyone." - ], - "griefAbuseHarassmentProtection": "No", - "harassmentProtectionSteps": [ - "" - ] - } - }, - "locations": { - "developmentCountries": [ - "USA", - "Ireland", - "UK", - "Canada", - "Spain", - "Italy", - "Australia" - ], - "deploymentCountries": [ - "Worldwide" - ] - } -} From 501715f43a724bdb6591cf572739c1deabbf9974 Mon Sep 17 00:00:00 2001 From: nathanbaleeta Date: Thu, 12 Aug 2021 23:16:30 +0300 Subject: [PATCH 4/5] Protection From Harassment indicator --- .../translation-initiative-for-covid-19.json | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/digitalpublicgoods/translation-initiative-for-covid-19.json b/digitalpublicgoods/translation-initiative-for-covid-19.json index 51fd49205..063a4894c 100644 --- a/digitalpublicgoods/translation-initiative-for-covid-19.json +++ b/digitalpublicgoods/translation-initiative-for-covid-19.json @@ -23,10 +23,10 @@ "privacy": { "isPrivacyCompliant": "Yes", "privacyComplianceList": [ - "" + "The translations are free to use under a CC0 license." ], "adherenceSteps": [ - "" + "We strongly encourage that professional translators handle the technical content, and that you follow a rigorous process of Quality Assurance over the produced translations."
] }, "standards": { @@ -52,12 +52,12 @@ "typesOfDataCollected": [ "" ], - "thirdPartyDataSharing": "Unknown", + "thirdPartyDataSharing": "No", "dataSharingCircumstances": [ "" ], - "ensurePrivacySecurity": "Unknown", - "privacySecurityDescription": "" + "ensurePrivacySecurity": "Yes", + "privacySecurityDescription": "We strongly encourage that professional translators handle the technical content, and that you follow a rigorous process of Quality Assurance over the produced translations." }, "inappropriateIllegalContent": { "collectStoreDistribute": "Yes", @@ -72,12 +72,11 @@ "Yes, there is a call for community contributions: https://tico-19.github.io/translators.html", "Professional translators are invited to share their translation memories or terminologies, as well as to use and potentially correct the provided datasets.", "We also invite translations of the existing data to more languages.", - "", "We do not anticipate any risk from underage or other users, hence we do not restrict access to anyone." ], - "griefAbuseHarassmentProtection": "No", + "griefAbuseHarassmentProtection": "Yes", "harassmentProtectionSteps": [ - "" + "We strongly encourage that professional translators handle the technical content, and that you follow a rigorous process of Quality Assurance over the produced translations."
] } }, From 9441e0e02dc8a702d74896d16dc0e4739f7ebd85 Mon Sep 17 00:00:00 2001 From: Nathan Baleeta Date: Thu, 31 Mar 2022 17:12:09 +0300 Subject: [PATCH 5/5] Updated developmentCountries field --- digitalpublicgoods/translation-initiative-for-covid-19.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/digitalpublicgoods/translation-initiative-for-covid-19.json b/digitalpublicgoods/translation-initiative-for-covid-19.json index 063a4894c..f190e888e 100644 --- a/digitalpublicgoods/translation-initiative-for-covid-19.json +++ b/digitalpublicgoods/translation-initiative-for-covid-19.json @@ -82,9 +82,9 @@ }, "locations": { "developmentCountries": [ - "USA", + "United States of America", "Ireland", - "UK", + "United Kingdom", "Canada", "Spain", "Italy",