Skip to content

Commit

Permalink
codemeta.json: updating according to (proposed) CLARIAH requirements (C…
Browse files Browse the repository at this point in the history
  • Loading branch information
proycon committed Jul 22, 2022
1 parent 33a5506 commit 54e235f
Showing 1 changed file with 47 additions and 59 deletions.
106 changes: 47 additions & 59 deletions codemeta.json
Original file line number Diff line number Diff line change
@@ -1,14 +1,15 @@
{
"@context": [
"https://doi.org/10.5063/schema/codemeta-2.0",
"http://schema.org"
"http://schema.org",
"https://w3id.org/software-types"
],
"@type": "SoftwareSourceCode",
"identifier": "colibricore",
"name": "Colibri Core",
"version": "2.5.5",
"version": "2.5.6",
"description": "Colibri core is an NLP tool as well as a C++ and Python library for working with basic linguistic constructions such as n-grams and skipgrams (i.e patterns with one or more gaps, either of fixed or dynamic size) in a quick and memory-efficient way. ",
"license": "https://spdx.org/licenses/GPL-3.0",
"license": "https://spdx.org/licenses/GPL-3.0-only",
"url": "https://proycon.github.io/colibri-core",
"author": [
{
Expand All @@ -35,7 +36,6 @@
}
}
],
"sourceOrganization": { "@id": "https://www.ru.nl/cls" },
"programmingLanguage": [{
"@type": "ComputerLanguage",
"identifier": "c++",
Expand All @@ -47,14 +47,15 @@
"name": "Cython"
}
],
"operatingSystem": "POSIX",
"operatingSystem": [ "Linux", "BSD" ,"macOS" ],
"codeRepository": "https://github.com/proycon/colibri-core",
"softwareRequirements": [ ],
"softwareHelp": "https://proycon.github.io/colibri-core/doc/",
"readme": "https://github.com/proycon/colibri-core/blob/master/README.md",
"issueTracker": "https://github.com/proycon/colibri-core/issues",
"contIntegration": "https://travis-ci.org/proycon/colibri-core",
"releaseNotes": "https://github.com/proycon/colibri-core/releases",
"developmentStatus": "active",
"developmentStatus": "https://www.repostatus.org/#active",
"keywords": [ "nlp", "natural language processing", "ngrams", "skipgrams", "pattern recognition", "language modelling" ],
"referencePublication": [
{
Expand All @@ -72,97 +73,84 @@
}
],
"dateCreated": "2013-09-15",
"entryPoints": [
"targetProduct": [
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-classencode",
"urlTemplate": "file:///colibri-classencode",
"description": "Encodes a plain text corpus to a binary encoded corpus and a class file",
"interfaceType": "CLI"
"executableName": "colibri-classencode",
"description": "Encodes a plain text corpus to a binary encoded corpus and a class file"
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-classdecode",
"urlTemplate": "file:///colibri-classdecode",
"description": "Decodes a binary encoded corpus and a class file to a plain text corpus",
"interfaceType": "CLI"
"executableName": "colibri-classdecode",
"description": "Decodes a binary encoded corpus and a class file to a plain text corpus"
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-patternmodeller",
"urlTemplate": "file:///colibri-patternmodeller",
"description": "Extract, model and compare recurring patterns (n-grams, skipgrams, flexgrams) and their frequencies in text corpus data. This is the main tool of Colibri Core.",
"interfaceType": "CLI"
"executableName": "colibri-patternmodeller",
"description": "Extract, model and compare recurring patterns (n-grams, skipgrams, flexgrams) and their frequencies in text corpus data. This is the main tool of Colibri Core."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-cooc",
"urlTemplate": "file:///colibri-cooc",
"description": "Computes co-occurrence statistics (absolute co-occurrence or pointwise mutual information) between patterns in a corpus",
"interfaceType": "CLI"
"executableName": "colibri-cooc",
"description": "Computes co-occurrence statistics (absolute co-occurrence or pointwise mutual information) between patterns in a corpus"
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-ngrams",
"urlTemplate": "file:///colibri-ngrams",
"description": "Extract n-grams of a particular size by moving a sliding window over the corpus. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-ngrams",
"description": "Extract n-grams of a particular size by moving a sliding window over the corpus. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-freqlist",
"urlTemplate": "file:///colibri-freqlist",
"description": "Extract n-grams (and optionally skipgrams) with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-freqlist",
"description": "Extract n-grams (and optionally skipgrams) with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-coverage",
"urlTemplate": "file:///colibri-coverage",
"description": "Computes the coverage of a training/background corpus on a particular test/foreground corpus, i.e. how many of the patterns in the test corpus were found during training, how many tokens are covered, and how is this all distributed? This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-coverage",
"description": "Computes the coverage of a training/background corpus on a particular test/foreground corpus, i.e. how many of the patterns in the test corpus were found during training, how many tokens are covered, and how is this all distributed? This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-findpatterns",
"urlTemplate": "file:///colibri-findpatterns",
"description": "Find patterns in corpus data based on a presupplied list of patterns (one per line). This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-findpatterns",
"description": "Find patterns in corpus data based on a presupplied list of patterns (one per line). This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-histogram",
"urlTemplate": "file:///colibri-histogram",
"description": "Computes a histogram for ngram occurrences (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-histogram",
"description": "Computes a histogram for ngram occurrences (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-loglikelihood",
"urlTemplate": "file:///colibri-loglikelihood",
"description": "Compares the frequency of patterns between two or more corpus files (plain text) by computing log likelihood, following the methodology of Rayson and Garside (2000), Comparing corpora using frequency profiling. In proceedings of the workshop on Comparing Corpora, held in conjunction with the 38th annual meeting of the Association for Computational Linguistics (ACL 2000). 1-8 October 2000, Hong Kong, pp. 1 - 6: http://www.comp.lancs.ac.uk/~paul/publications/rg_acl2000.pdf. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-loglikelihood",
"description": "Compares the frequency of patterns between two or more corpus files (plain text) by computing log likelihood, following the methodology of Rayson and Garside (2000), Comparing corpora using frequency profiling. In proceedings of the workshop on Comparing Corpora, held in conjunction with the 38th annual meeting of the Association for Computational Linguistics (ACL 2000). 1-8 October 2000, Hong Kong, pp. 1 - 6: http://www.comp.lancs.ac.uk/~paul/publications/rg_acl2000.pdf. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-ngramstats",
"urlTemplate": "file:///colibri-ngramstats",
"description": "Computes a summary report on the count of ngrams (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-ngramstats",
"description": "Computes a summary report on the count of ngrams (and optionally skipgrams) in the corpus. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-queryngrams",
"urlTemplate": "file:///colibri-queryngrams",
"description": "Interactive command line tool to query n-grams with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-queryngrams",
"description": "Interactive command line tool to query n-grams with their counts from one or more plain-text corpus files. This is a high-level convenience script over underlying tools."
},
{
"@type": "EntryPoint",
"@type": "CommandLineApplication",
"name": "colibri-reverseindex",
"urlTemplate": "file:///colibri-reverseindex",
"description": "Computes and prints reverse index of the corpus, for each token position in the corpus, all patterns that start at that position are shown. This is a high-level convenience script over underlying tools.",
"interfaceType": "CLI"
"executableName": "colibri-reverseindex",
"description": "Computes and prints reverse index of the corpus, for each token position in the corpus, all patterns that start at that position are shown. This is a high-level convenience script over underlying tools."
}
]
}

0 comments on commit 54e235f

Please sign in to comment.