From 54e235f76975e28a73a165551429f379dd6f4af2 Mon Sep 17 00:00:00 2001 From: Maarten van Gompel Date: Fri, 22 Jul 2022 20:40:14 +0200 Subject: [PATCH] codemeta.json: updating according to (proposed) CLARIAH requirements (CLARIAH/clariah-plus#38) --- codemeta.json | 106 ++++++++++++++++++++++---------------------------- 1 file changed, 47 insertions(+), 59 deletions(-) diff --git a/codemeta.json b/codemeta.json index 1a59117..a24fea1 100644 --- a/codemeta.json +++ b/codemeta.json @@ -1,14 +1,15 @@ { "@context": [ "https://doi.org/10.5063/schema/codemeta-2.0", - "http://schema.org" + "http://schema.org", + "https://w3id.org/software-types" ], "@type": "SoftwareSourceCode", "identifier": "colibricore", "name": "Colibri Core", - "version": "2.5.5", + "version": "2.5.6", "description": "Colibri core is an NLP tool as well as a C++ and Python library for working with basic linguistic constructions such as n-grams and skipgrams (i.e patterns with one or more gaps, either of fixed or dynamic size) in a quick and memory-efficient way. 
", - "license": "https://spdx.org/licenses/GPL-3.0", + "license": "https://spdx.org/licenses/GPL-3.0-only", "url": "https://proycon.github.io/colibri-core", "author": [ { @@ -35,7 +36,6 @@ } } ], - "sourceOrganization": { "@id": "https://www.ru.nl/cls" }, "programmingLanguage": [{ "@type": "ComputerLanguage", "identifier": "c++", @@ -47,14 +47,15 @@ "name": "Cython" } ], - "operatingSystem": "POSIX", + "operatingSystem": [ "Linux", "BSD" ,"macOS" ], "codeRepository": "https://github.com/proycon/colibri-core", "softwareRequirements": [ ], + "softwareHelp": "https://proycon.github.io/colibri-core/doc/", "readme": "https://github.com/proycon/colibri-core/blob/master/README.md", "issueTracker": "https://github.com/proycon/colibri-core/issues", "contIntegration": "https://travis-ci.org/proycon/colibri-core", "releaseNotes": "https://github.com/proycon/colibri-core/releases", - "developmentStatus": "active", + "developmentStatus": "https://www.repostatus.org/#active", "keywords": [ "nlp", "natural language processing", "ngrams", "skipgrams", "pattern recognition", "language modelling" ], "referencePublication": [ { @@ -72,97 +73,84 @@ } ], "dateCreated": "2013-09-15", - "entryPoints": [ + "targetProduct": [ { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-classencode", - "urlTemplate": "file:///colibri-classencode", - "description": "Encodes a plain text corpus to a binary encoded corpus and a class file", - "interfaceType": "CLI" + "executableName": "colibri-classencode", + "description": "Encodes a plain text corpus to a binary encoded corpus and a class file" }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-classdecode", - "urlTemplate": "file:///colibri-classdecode", - "description": "Decodes a binary encoded corpus and a class file to a plain text corpus", - "interfaceType": "CLI" + "executableName": "colibri-classdecode", + "description": "Decodes a binary encoded corpus and a class file to a plain 
text corpus" }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-patternmodeller", - "urlTemplate": "file:///colibri-patternmodeller", - "description": "Extract, model and compare recurring patterns (n-grams, skipgrams, flexgrams) and their frequencies in text corpus data. This is the main tool of Colibri Core.", - "interfaceType": "CLI" + "executableName": "colibri-patternmodeller", + "description": "Extract, model and compare recurring patterns (n-grams, skipgrams, flexgrams) and their frequencies in text corpus data. This is the main tool of Colibri Core." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-cooc", - "urlTemplate": "file:///colibri-cooc", - "description": "Computes co-occurrence statistics (absolute co-cooccurrence or pointwise mutual information) between patterns in a corpus", - "interfaceType": "CLI" + "executableName": "colibri-cooc", + "description": "Computes co-occurrence statistics (absolute co-occurrence or pointwise mutual information) between patterns in a corpus" }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-ngrams", - "urlTemplate": "file:///colibri-ngrams", - "description": "Extract n-grams of a particular size by moving a sliding window over the corpus. This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-ngrams", + "description": "Extract n-grams of a particular size by moving a sliding window over the corpus. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-freqlist", - "urlTemplate": "file:///colibri-freqlist", - "description": "Extract n-grams (and optionally skipgrams) with their counts from one or more plain-text corpus files. 
This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-freqlist", + "description": "Extract n-grams (and optionally skipgrams) with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-coverage", - "urlTemplate": "file:///colibri-coverage", - "description": "Computes the coverage of training/background corpus on a particular test/foreground corpus, i.e how many of the patterns in the test corpus were found during training, how many tokens are covered, and how is this all distributed?. This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-coverage", + "description": "Computes the coverage of a training/background corpus on a particular test/foreground corpus, i.e. how many of the patterns in the test corpus were found during training, how many tokens are covered, and how this is all distributed. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-findpatterns", - "urlTemplate": "file:///colibri-findpatterns", - "description": "Find patterns in corpus data based on a presupplied list of patterns (one per line). This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-findpatterns", + "description": "Find patterns in corpus data based on a presupplied list of patterns (one per line). This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-histogram", - "urlTemplate": "file:///colibri-histogram", - "description": "Computes a histogram for ngram occurrences (and optionally skipgrams) in the corpus. 
This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-histogram", + "description": "Computes a histogram for ngram occurrences (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-loglikelihood", - "urlTemplate": "file:///colibri-loglikelihood", - "description": "Compares the frequency of patterns between two or more corpus files (plain text) by computing log likelihood, following the methodology of Rayson and Garside (2000), Comparing corpora using frequency profiling. In proceedings of the workshop on Comparing Corpora, held in conjunction with the 38th annual meeting of the Association for Computational Linguistics (ACL 2000). 1-8 October 2000, Hong Kong, pp. 1 - 6: http://www.comp.lancs.ac.uk/~paul/publications/rg_acl2000.pdf. This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-loglikelihood", + "description": "Compares the frequency of patterns between two or more corpus files (plain text) by computing log likelihood, following the methodology of Rayson and Garside (2000), Comparing corpora using frequency profiling. In proceedings of the workshop on Comparing Corpora, held in conjunction with the 38th annual meeting of the Association for Computational Linguistics (ACL 2000). 1-8 October 2000, Hong Kong, pp. 1 - 6: http://www.comp.lancs.ac.uk/~paul/publications/rg_acl2000.pdf. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-ngramstats", - "urlTemplate": "file:///colibri-ngramstats", - "description": "Computes a summary report on the count of ngrams (and optionally skipgrams) in the corpus. 
This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-ngramstats", + "description": "Computes a summary report on the count of ngrams (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-queryngrams", - "urlTemplate": "file:///colibri-queryngrams", - "description": "Interactive command line tool to n-grams with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-queryngrams", + "description": "Interactive command line tool to query n-grams with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools." }, { - "@type": "EntryPoint", + "@type": "CommandLineApplication", "name": "colibri-reverseindex", - "urlTemplate": "file:///colibri-reverseindex", - "description": "Computes and prints reverse index of the corpus, for each token position in the corpus, all patterns that start at that position are shown. This is a high-level convenience script over underlying tools.", - "interfaceType": "CLI" + "executableName": "colibri-reverseindex", + "description": "Computes and prints a reverse index of the corpus: for each token position in the corpus, all patterns that start at that position are shown. This is a high-level convenience script over underlying tools." } ] }