{
    "@context": [
        "https://w3id.org/codemeta/3.0",
        "https://w3id.org/software-iodata",
        "https://w3id.org/nwo-research-fields",
        "https://raw.githubusercontent.com/jantman/repostatus.org/master/badges/latest/ontology.jsonld",
        "https://w3id.org/research-technology-readiness-levels",
        "https://schema.org",
        "https://w3id.org/software-types"
    ],
    "@id": "https://tools.clariah.nl/mbt/3.11",
    "@type": "SoftwareSourceCode",
    "author": [
        {
            "@type": "Person",
            "affiliation": {
                "@id": "https://www.ru.nl/clst",
                "@type": "Organization",
                "name": "Centre for Language and Speech Technology",
                "parentOrganization": {
                    "@id": "https://www.ru.nl/cls",
                    "@type": "Organization",
                    "name": "Centre for Language Studies",
                    "parentOrganization": {
                        "@id": "https://www.ru.nl",
                        "@type": "Organization",
                        "location": {
                            "@type": "Place",
                            "name": "Nijmegen"
                        },
                        "name": "Radboud University",
                        "url": "https://www.ru.nl"
                    },
                    "url": "https://www.ru.nl/cls"
                },
                "url": "https://www.ru.nl/clst"
            },
            "email": "ko.vandersloot@let.ru.nl",
            "familyName": "van der Sloot",
            "givenName": "Ko"
        },
        {
            "@id": "https://orcid.org/0000-0003-2493-656X",
            "@type": "Person",
            "affiliation": {
                "@id": "https://cls.ru.nl"
            },
            "email": "antal.vandenbosch@let.ru.nl",
            "familyName": "van den Bosch",
            "givenName": "Antal",
            "position": 2
        },
        {
            "@type": "Person",
            "familyName": "Daelemans",
            "givenName": "Walter"
        },
        {
            "@type": "Person",
            "familyName": "Zavrel",
            "givenName": "Jakub"
        }
    ],
    "codeRepository": "https://github.com/LanguageMachines/mbt",
    "continuousIntegration": {
        "@id": "https://travis-ci.org/LanguageMachines/mbt"
    },
    "contributor": [
        {
            "@type": "Person",
            "affiliation": {
                "@id": "https://www.ru.nl/clst",
                "@type": "Organization",
                "name": "Centre for Language and Speech Technology",
                "parentOrganization": {
                    "@id": "https://www.ru.nl/cls",
                    "@type": "Organization",
                    "name": "Centre for Language Studies",
                    "parentOrganization": {
                        "@id": "https://www.ru.nl",
                        "@type": "Organization",
                        "location": {
                            "@type": "Place",
                            "name": "Nijmegen"
                        },
                        "name": "Radboud University",
                        "url": "https://www.ru.nl"
                    },
                    "url": "https://www.ru.nl/cls"
                },
                "url": "https://www.ru.nl/clst"
            },
            "email": "ko.vandersloot@let.ru.nl",
            "familyName": "van der Sloot",
            "givenName": "Ko"
        },
        {
            "@id": "https://orcid.org/0000-0003-2493-656X",
            "@type": "Person",
            "affiliation": {
                "@id": "https://cls.ru.nl"
            },
            "email": "antal.vandenbosch@let.ru.nl",
            "familyName": "van den Bosch",
            "givenName": "Antal",
            "position": 2
        },
        {
            "@type": "Person",
            "familyName": "Daelemans",
            "givenName": "Walter"
        },
        {
            "@type": "Person",
            "familyName": "Zavrel",
            "givenName": "Jakub"
        }
    ],
    "description": "MBT is a memory-based tagger-generator and tagger in one. The tagger-generator part can generate a sequence tagger on the basis of a training set of tagged sequences; the tagger part can tag new sequences. MBT can, for instance, be used to generate part-of-speech taggers or chunkers for natural language processing. It has also been used for named-entity recognition, information extraction in domain-specific texts, and disfluency chunking in transcribed speech. ",
    "developmentStatus": {
        "@id": "https://www.repostatus.org/#active",
        "@type": "skos:Concept",
        "og:image": "https://www.repostatus.org/badges/latest/active.svg",
        "skos:definition": "The project has reached a stable, usable state and is being actively developed.",
        "skos:inScheme": "https://www.repostatus.org",
        "skos:prefLabel": "Active"
    },
    "https://github.com/proycon/codemetapy/errors": 0,
    "https://github.com/proycon/codemetapy/log": "(log file starts at Thu Jun 18 03:14:48 UTC 2026)\n\n[harvester info] --> Processing mbt (https://github.com/LanguageMachines/mbt) [Thu Jun 18 03:14:48 UTC 2026]\n\n[harvester info] Git updating cached clone of https://github.com/LanguageMachines/mbt...\n\n[harvester info] Found release v3.11\n\n[harvester info] Using 'v3.11'\n\n[harvester info] Git reference: v3.11\n\n[harvester info] Scanning directory /tmp/codemeta-harvester.cache/mbt for harvestable resources...\n\n[harvester info] found codemeta.json for mbt (md5sum 1144001f8e312622e9c47ffd33c926a7); **NOTE: this is considered authoritative and most other detection methods will be skipped now!**\n\n[harvester info] Inferring repostatus information from git activity (used only as a fallback if not explicitly provided)...\n\n[harvester info] Inferred repostatus https://www.repostatus.org/#active\n\n[harvester info] Looking for repostatus information in README.md in master branch...\n\n[harvester info] Looking for repostatus information in README in master branch...\n\n[harvester info] Parsing MAINTAINERS from master branch...\n\n[harvester info] Reconciliating: codemetapy  --baseuri https://tools.clariah.nl --baseuri https://tools.clariah.nl --includecontext --addcontext https://w3id.org/nwo-research-fields --addcontext https://w3id.org/research-technology-readiness-levels --addcontextgraph https://vocabs.dariah.eu/rest/v1/tadirah/data?format=text/turtle --trl --identifier \"mbt\" --codeRepository \"https://github.com/LanguageMachines/mbt\" --validate /etc/software.ttl --released --enrich --textv \"Please consult the CLARIAH Software Metadata Requirements at https://github.com/CLARIAH/clariah-plus/blob/main/requirements/software-metadata-requirements.md for an in-depth explanation of any found problems\" -O /tmp/out/mbt.codemeta.json /tmp/codemeta-harvester.cache//tmp/99-repostatus.mbt.codemeta.json /tmp/codemeta-harvester.cache//tmp/10-jsonld.mbt.codemeta.json /tmp/codemeta-harvester.cache//tmp/05-maintainers.mbt.codemeta.json \n\n-- begin log --\n\nPassed 3 files/sources but specified 0 input types! Automatically guessing types...\n\nDetected input types: [('/tmp/codemeta-harvester.cache//tmp/99-repostatus.mbt.codemeta.json', 'json'), ('/tmp/codemeta-harvester.cache//tmp/10-jsonld.mbt.codemeta.json', 'json'), ('/tmp/codemeta-harvester.cache//tmp/05-maintainers.mbt.codemeta.json', 'json')]\n\nAdding to contextgraph: /tmp/turtle\n\nInitial URI automatically generated, may be overriden later: https://tools.clariah.nl/mbt\n\nProcessing source #1 of 3\n\nParsing json-ld file from /tmp/codemeta-harvester.cache//tmp/99-repostatus.mbt.codemeta.json\n\n    NOTE: Not a valid JSON-LD document, @context missing! Attempting to inject automatically...\n\n    Injected (possibly temporary) URI https://tools.clariah.nl/mbt\n\n[CODEMETA COMPOSITION (https://tools.clariah.nl/mbt)] processed 1 new triples, total is now 2\n\nProcessing source #2 of 3\n\nParsing json-ld file from /tmp/codemeta-harvester.cache//tmp/10-jsonld.mbt.codemeta.json\n\n    Injected (possibly temporary) URI https://tools.clariah.nl/mbt\n\n[CODEMETA 2 TO 3] Updating contIntegration -> continuousIntegration\n\n[CODEMETA 2 TO 3] Updating targetProduct -> isSourceCodeOf\n\n[CODEMETA 2 TO 3] Updating targetProduct -> isSourceCodeOf\n\n[CODEMETA CORRECTION (mbt)] automatically converting spdx license URI from https:// to http:///\n\n[CODEMETA COMPOSITION (mbt)] processed 112 new triples, total is now 112\n\nProcessing source #3 of 3\n\nParsing json-ld file from /tmp/codemeta-harvester.cache//tmp/05-maintainers.mbt.codemeta.json\n\n    Found main resource with URI https://tools.clariah.nl/maintainers/snapshot\n\n    Injected (possibly temporary) URI https://tools.clariah.nl/mbt\n\n[CODEMETA COMPOSITION (mbt)] processed 14 new triples, total is now 125\n\nRemapping URI to (possibly) new identifier and version component: https://tools.clariah.nl/mbt -> https://tools.clariah.nl/mbt/3.11\n\n[CODEMETA VALIDATION (mbt)] done\n\n[CODEMETA ENRICHMENT (mbt)] adding author https://tools.clariah.nl/stub/H-274d12090545b345 as contributor\n\n[CODEMETA ENRICHMENT (mbt)] adding author https://orcid.org/0000-0003-2493-656X as contributor\n\n[CODEMETA ENRICHMENT (mbt)] adding author https://tools.clariah.nl/stub/H5823b4ae69a0f5d4 as contributor\n\n[CODEMETA ENRICHMENT (mbt)] adding author https://tools.clariah.nl/stub/H-95a6a0ca9d9a5db as contributor\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #1: Warning: Documentation *SHOULD* be expressed (This is missing in the metadata)\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #2: Info: Reference publications *SHOULD* be expressed, if any (The metadata does express this currently, but something is wrong in the way it is expressed. Is the type/class valid?)\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #3: Info: The funder *SHOULD* be acknowledged (This is missing in the metadata)\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #4: Info: The technology readiness level *SHOULD* be expressed (This is missing in the metadata)\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #5: Info: A research domain *SHOULD* be expressed as a category using the NWO Research Fields vocabulary, if applicable (This is missing in the metadata)\n\nVALIDATION https://tools.clariah.nl/mbt/3.11 #6: Info: A research activity *SHOULD* be expressed as a category using the TaDiRaH vocabulary (This is missing in the metadata)\n\n-- end log --\n\n[harvester info] Output written to /tmp/out/mbt.codemeta.json\n\n[harvester info] <-- Finished processing mbt (https://github.com/LanguageMachines/mbt) [Thu Jun 18 03:14:52 UTC 2026]\n",
    "identifier": "mbt",
    "isSourceCodeOf": [
        {
            "@type": "SoftwareLibrary",
            "description": "Memory-based Tagging Library with API for C++",
            "executableName": "libmbt",
            "name": "libmbt",
            "runtimePlatform": [
                "BSD",
                "Linux",
                "macOS"
            ]
        },
        {
            "@type": "CommandLineApplication",
            "description": "Memory-based tagger, command-line tool",
            "executableName": "mbt",
            "name": "mbt",
            "runtimePlatform": [
                "BSD",
                "Linux",
                "macOS"
            ]
        }
    ],
    "issueTracker": "https://github.com/LanguageMachines/mbt/issues",
    "keywords": [
        "machine learning",
        "memory based learning",
        "natural language processing",
        "nlp",
        "tagger"
    ],
    "license": {
        "@id": "http://spdx.org/licenses/GPL-3.0"
    },
    "maintainer": [
        {
            "@id": "https://tools.clariah.nl/person/maarten-van-gompel",
            "@type": "Person",
            "affiliation": [
                {
                    "@id": "https://tools.clariah.nl/org/knaw-humanities-cluster",
                    "@type": "Organization",
                    "name": "KNAW Humanities Cluster",
                    "url": "https://huc.knaw.nl/"
                },
                {
                    "@id": "https://tools.clariah.nl/org/knaw-humanities-cluster-clst-radboud-university",
                    "@type": "Organization",
                    "name": "KNAW Humanities Cluster & CLST, Radboud University"
                }
            ],
            "email": "proycon@anaproy.nl",
            "familyName": [
                "van Gompel",
                "van gompel"
            ],
            "givenName": "Maarten",
            "url": "https://proycon.anaproy.nl"
        },
        {
            "@id": "https://tools.clariah.nl/person/ko-van-der-sloot",
            "@type": "Person",
            "email": [
                "K.vanderSloot@let.ru.nl",
                "Ko.vanderSloot@ziggo.nl"
            ],
            "familyName": "van der Sloot",
            "givenName": "Ko"
        }
    ],
    "name": "mbt",
    "operatingSystem": [
        "BSD",
        "Linux",
        "macOS"
    ],
    "owl:sameAs": {
        "@id": "https://tools.clariah.nl/maintainers/snapshot"
    },
    "producer": {
        "@id": "https://huc.knaw.nl",
        "@type": "Organization",
        "name": [
            "Humanities Cluster",
            "KNAW Humanities Cluster"
        ],
        "parentOrganization": {
            "@id": "https://knaw.nl",
            "@type": "Organization",
            "location": {
                "@type": "Place",
                "name": "Amsterdam"
            },
            "name": "KNAW",
            "url": "https://knaw.nl"
        },
        "url": "https://huc.knaw.nl"
    },
    "programmingLanguage": {
        "@type": "ComputerLanguage",
        "identifier": "c++",
        "name": "C++"
    },
    "readme": "https://github.com/LanguageMachines/mbt/blob/master/README.md",
    "referencePublication": {
        "@type": "Book",
        "author": [
            "Walter Daelemans",
            "Antal van den Bosch"
        ],
        "name": "Memory-Based Language Processing",
        "publisher": "Cambridge University Press",
        "url": "http://ilk.uvt.nl/mblp"
    },
    "releaseNotes": "https://github.com/LanguageMachines/mbt/releases",
    "review": {
        "@id": "https://tools.clariah.nl/validation/N5e8013314e2a1324ef92e277d4e52f6e",
        "@type": "Review",
        "author": [
            "codemetapy validator using software.ttl"
        ],
        "datePublished": "2026-06-18 03:14:52",
        "name": "Automatic software metadata validation report for mbt 3.11",
        "reviewBody": "Please consult the CLARIAH Software Metadata Requirements at https://github.com/CLARIAH/clariah-plus/blob/main/requirements/software-metadata-requirements.md for an in-depth explanation of any found problems\n\nValidation of mbt 3.11 was successful (score=3/5), but there are some warnings which should be addressed:\n\n1. Warning: Documentation *SHOULD* be expressed (This is missing in the metadata)\n2. Info: Reference publications *SHOULD* be expressed, if any (The metadata does express this currently, but something is wrong in the way it is expressed. Is the type/class valid?)\n3. Info: The funder *SHOULD* be acknowledged (This is missing in the metadata)\n4. Info: The technology readiness level *SHOULD* be expressed (This is missing in the metadata)\n5. Info: A research domain *SHOULD* be expressed as a category using the NWO Research Fields vocabulary, if applicable (This is missing in the metadata)\n6. Info: A research activity *SHOULD* be expressed as a category using the TaDiRaH vocabulary (This is missing in the metadata)",
        "reviewRating": 3
    },
    "softwareRequirements": [
        {
            "@type": "SoftwareApplication",
            "identifier": "libxml2",
            "name": "libxml2"
        },
        {
            "@type": "SoftwareApplication",
            "identifier": "ticcutils",
            "name": "ticcutils"
        },
        {
            "@type": "SoftwareApplication",
            "identifier": "timbl",
            "name": "timbl"
        }
    ],
    "url": "https://languagemachines.github.io/mbt",
    "version": "3.11"
}