@prefix codemeta: .
@prefix dcterms: .
@prefix iodata: .
@prefix ns1: .
@prefix ns2: .
@prefix owl: .
@prefix rdf: .
@prefix rdfs: .
@prefix sdo: .
@prefix skos: .
@prefix stype: .
@prefix xsd: .
a rdfs:Class .
a skos:Concept,
;
skos:inScheme "https://w3id.org/nwo-research-fields#Scheme" ;
skos:prefLabel "Computers and the humanities" .
a skos:ConceptScheme ;
dcterms:creator "Maarten van Gompel" ;
dcterms:description "Ontology of the NWO Research fields, as used in grant applications by the Dutch Research Council (NWO): https://www.nwo.nl/en/nwo-research-fields" ;
dcterms:title "NWO Research Fields" .
a skos:Concept,
;
skos:broader "https://w3id.org/nwo-research-fields#ComputersAndTheHumanities" ;
skos:inScheme "https://w3id.org/nwo-research-fields#Scheme" ;
skos:notation "37.10.00" ;
skos:prefLabel "Software for humanities" .
a skos:ConceptScheme ;
dcterms:creator "Jason Antman" ;
dcterms:description "A standard to easily communicate to humans and machines the development/support and usability status of software repositories/projects." ;
dcterms:title "repostatus.org" .
sdo:WebApplication rdfs:label "Web Application" ;
rdfs:comment "A software application served as a service over the web with an interface for human end-users" .
sdo:name "GNU Affero General Public License v3" .
a owl:NamedIndividual,
skos:Concept ;
skos:broader ;
skos:definition "Wikidata contributors, \"Q98846987,\" Wikidata, https://www.wikidata.org/w/index.php?title=Q98846987&oldid=1270659968 (accessed September 4, 2020)."@en ;
skos:prefLabel "Speech Recognizing"@en .
a skos:Concept,
;
skos:broader "trl:Stage4Complete" ;
skos:definition "Technology complete and proven in practice by real users." ;
skos:inScheme "trl:Scheme" ;
skos:notation "9" ;
skos:prefLabel "9 - Proven" .
a sdo:SoftwareSourceCode ;
sdo:applicationCategory ,
"https://w3id.org/nwo-research-fields#SoftwareForHumanities" ;
sdo:author ;
sdo:codeRepository ;
sdo:contributor ;
sdo:dateCreated "2017-04-02"^^sdo:Date ;
sdo:description "This is a web-based automatic speech recogniser for Dutch, capable of transcribing dutch speech recordings using multiple models." ;
sdo:identifier "asr_nl" ;
sdo:keywords "dutch",
"nlp",
"speech recognition" ;
sdo:license ;
sdo:maintainer ;
sdo:name "Automatic Speech Recognition for Dutch" ;
sdo:operatingSystem "Linux" ;
sdo:producer ;
sdo:review ;
sdo:softwareRequirements ,
,
;
sdo:sourceOrganization ;
sdo:targetProduct ,
;
sdo:url ;
sdo:version "0.6.2" ;
owl:sameAs ;
codemeta:developmentStatus ,
;
codemeta:issueTracker ;
codemeta:readme ;
ns2:errors 0 ;
ns2:log """(log file starts at Sun Dec 22 04:00:57 UTC 2024)
[harvester info] --> Processing asr_nl (https://github.com/opensource-spraakherkenning-nl/asr_nl) [Sun Dec 22 04:00:57 UTC 2024]
[harvester info] Git updating cached clone of https://github.com/opensource-spraakherkenning-nl/asr_nl...
[harvester info] Found release v0.6.2
[harvester info] Using 'v0.6.2'
[harvester info] Git reference: v0.6.2
[harvester info] Scanning directory /tmp/codemeta-harvester.cache/asr_nl for harvestable resources...
[harvester info] found codemeta.json for asr_nl (md5sum c38d31855921f1b956862aa9c5b2bed7); **NOTE: this is considered authoritative and most other detection methods will be skipped now!**
[harvester info] Inferring repostatus information from git activity (used only as a fallback if not explicitly provided)...
[harvester info] Inferred repostatus https://www.repostatus.org/#inactive
[harvester info] Looking for repostatus information in README.md in master branch...
-- begin log --
-- end log --
[harvester info] Found README.md
[harvester info] Reconciliating: codemetapy --baseuri https://webservices.cls.ru.nl/portal --baseuri https://webservices.cls.ru.nl/portal --includecontext --addcontext https://w3id.org/nwo-research-fields --addcontext https://w3id.org/research-technology-readiness-levels --addcontextgraph https://vocabs.dariah.eu/rest/v1/tadirah/data?format=text/turtle --trl --identifier "asr_nl" --codeRepository "https://github.com/opensource-spraakherkenning-nl/asr_nl" --validate /etc/software.ttl --released --enrich --textv "Please consult the CLARIAH Software Metadata Requirements at https://github.com/CLARIAH/clariah-plus/blob/main/requirements/software-metadata-requirements.md for an in-depth explanation of any found problems" -O /tmp/out/asr_nl.codemeta.json /tmp/codemeta-harvester.cache//tmp/99-repostatus.asr_nl.codemeta.json /tmp/codemeta-harvester.cache//tmp/41-readme.asr_nl.codemeta.json /tmp/codemeta-harvester.cache//tmp/10-jsonld.asr_nl.codemeta.json
-- begin log --
Passed 3 files/sources but specified 0 input types! Automatically guessing types...
Detected input types: [('/tmp/codemeta-harvester.cache//tmp/99-repostatus.asr_nl.codemeta.json', 'json'), ('/tmp/codemeta-harvester.cache//tmp/41-readme.asr_nl.codemeta.json', 'json'), ('/tmp/codemeta-harvester.cache//tmp/10-jsonld.asr_nl.codemeta.json', 'json')]
Adding to contextgraph: /tmp/turtle
Initial URI automatically generated, may be overriden later: https://webservices.cls.ru.nl/portal/asr-nl
Processing source #1 of 3
Parsing json-ld file from /tmp/codemeta-harvester.cache//tmp/99-repostatus.asr_nl.codemeta.json
NOTE: Not a valid JSON-LD document, @context missing! Attempting to inject automatically...
Injected (possibly temporary) URI https://webservices.cls.ru.nl/portal/asr-nl
[CODEMETA COMPOSITION (https://webservices.cls.ru.nl/portal/asr-nl)] processed 1 new triples, total is now 2
Processing source #2 of 3
Parsing json-ld file from /tmp/codemeta-harvester.cache//tmp/41-readme.asr_nl.codemeta.json
NOTE: Not a valid JSON-LD document, @context missing! Attempting to inject automatically...
Injected (possibly temporary) URI https://webservices.cls.ru.nl/portal/asr-nl
[CODEMETA COMPOSITION (https://webservices.cls.ru.nl/portal/asr-nl)] processed 1 new triples, total is now 3
Processing source #3 of 3
Parsing json-ld file from /tmp/codemeta-harvester.cache//tmp/10-jsonld.asr_nl.codemeta.json
Injected (possibly temporary) URI https://webservices.cls.ru.nl/portal/asr-nl
[CODEMETA COMPOSITION (asr_nl)] overriding old https://codemeta.github.io/terms/readme (https://github.com/proycon/alpino_clam_webservice/blob/v0.6.2/README.md -> https://github.com/opensource-spraakherkenning-nl/asr_nl/blob/master/README.md)
[CODEMETA COMPOSITION (asr_nl)] overriding old https://codemeta.github.io/terms/developmentStatus (https://www.repostatus.org/#inactive -> https://www.repostatus.org/#active)
[CODEMETA CORRECTION (asr_nl)] automatically converting spdx license URI from https:// to http:///
[CODEMETA COMPOSITION (asr_nl)] processed 70 new triples, total is now 70
Remapping URI to (possibly) new identifier and version component: https://webservices.cls.ru.nl/portal/asr-nl -> https://webservices.cls.ru.nl/portal/asr_nl/0.6.2
[CODEMETA VALIDATION (asr_nl)] done
[CODEMETA ENRICHMENT (asr_nl)] Guessing interface type https://w3id.org/software-types#WebApplication based on clues
[CODEMETA ENRICHMENT (asr_nl)] adding author https://webservices.cls.ru.nl/portal/stub/H-72fbea18c5643ce1 as contributor
[CODEMETA ENRICHMENT (asr_nl)] adding author https://webservices.cls.ru.nl/portal/stub/H0ee3f79658e0da71 as contributor
[CODEMETA ENRICHMENT (asr_nl)] adding author https://webservices.cls.ru.nl/portal/stub/H-1863f5d541a99da4 as contributor
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #1: Warning: Software source code *SHOULD* link to a continuous integration service that builds the software and runs the software's tests (This is missing in the metadata)
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #2: Info: Software source code *MAY* express the programming language(s) used (This is missing in the metadata)
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #3: Info: An interface type *SHOULD* be expressed: Software source code should define one or more target products that are the resulting software applications offering specific interfaces (The metadata does express this currently, but something is wrong in the way it is expressed. Is the type/class valid?)
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #4: Warning: Documentation *SHOULD* be expressed (This is missing in the metadata)
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #5: Info: Reference publications *SHOULD* be expressed, if any (This is missing in the metadata)
VALIDATION https://webservices.cls.ru.nl/portal/asr_nl/0.6.2 #6: Info: The funder *SHOULD* be acknowledged (This is missing in the metadata)
-- end log --
[harvester info] Output written to /tmp/out/asr_nl.codemeta.json
[harvester info] Harvesting remote service URL https://webservices.cls.ru.nl/asr_nl/ for asr_nl: codemetapy --baseuri https://webservices.cls.ru.nl/portal --baseuri https://webservices.cls.ru.nl/portal --includecontext --addcontext https://w3id.org/nwo-research-fields --addcontext https://w3id.org/research-technology-readiness-levels --addcontextgraph https://vocabs.dariah.eu/rest/v1/tadirah/data?format=text/turtle --trl -O "/tmp/codemeta-harvester.cache//tmp/asr_nl.codemeta.json" "/tmp/out/asr_nl.codemeta.json" "https://webservices.cls.ru.nl/asr_nl/"
-- begin log --
Passed 2 files/sources but specified 0 input types! Automatically guessing types...
Detected input types: [('/tmp/out/asr_nl.codemeta.json', 'json'), ('https://webservices.cls.ru.nl/asr_nl/', 'web')]
Adding to contextgraph: /tmp/turtle
Initial URI automatically generated, may be overriden later: https://webservices.cls.ru.nl/portal/asr-nl
Processing source #1 of 2
Parsing json-ld file from /tmp/out/asr_nl.codemeta.json
Found main resource with URI https://webservices.cls.ru.nl/portal/asr_nl/0.6.2
Injected (possibly temporary) URI https://webservices.cls.ru.nl/portal/asr-nl
[CODEMETA COMPOSITION (asr_nl)] processed 109 new triples, total is now 109
Processing source #2 of 2
Fallback: Obtaining metadata from remote URL https://webservices.cls.ru.nl/asr_nl/
Service replied with content-type application/ld+json
Parsing json...
Found main resource with URI https://webservices.cls.ru.nl/asr_nl
Injected (possibly temporary) URI https://webservices.cls.ru.nl/portal/webapplication/N99cf35b6a6a63b06780f6a079e8b881d
Adding service (targetProduct) https://webservices.cls.ru.nl/asr_nl/
[CODEMETA COMPOSITION (asr_nl)] processed 80 new triples, total is now 190
Remapping URI to (possibly) new identifier and version component: https://webservices.cls.ru.nl/portal/asr-nl -> https://webservices.cls.ru.nl/portal/asr_nl/0.6.2
[CODEMETA VALIDATION (asr_nl)] done
-- end log --
[harvester info] <-- Finished processing asr_nl (https://github.com/opensource-spraakherkenning-nl/asr_nl) [Sun Dec 22 04:01:04 UTC 2024]
""" .
a sdo:AudioObject ;
sdo:description "MP4 file" ;
sdo:encodingFormat "audio/mpeg" ;
sdo:identifier "MP4AudioFormat" ;
sdo:name "*.mp4" .
a sdo:Place ;
sdo:name "Nijmegen" .
a sdo:SoftwareApplication ;
sdo:identifier "clam" ;
sdo:name "CLAM" .
a sdo:AudioObject ;
sdo:description "Wav file" ;
sdo:encodingFormat "audio/vnd.wave" ;
sdo:identifier "WaveAudioFormat" ;
sdo:name "*.wav" .
a sdo:DigitalDocument ;
sdo:description "Automatic transcription of the input recording with timestamps (CTM) and speaker diarisation" ;
sdo:encodingFormat "text/plain" ;
sdo:identifier "CTMFormat" ;
sdo:name "*.ctm.spk" .
a sdo:DigitalDocument ;
sdo:description "Automatic transcription of the input recording" ;
sdo:encodingFormat "text/plain" ;
sdo:identifier "PlainTextFormat" ;
sdo:name "*.txt" .
rdf:first ;
rdf:rest () .
rdf:first ;
rdf:rest () .
a sdo:DigitalDocument ;
sdo:description "Automatic transcription of the input recording with timestamps (CTM)" ;
sdo:encodingFormat "text/plain" ;
sdo:identifier "CTMFormat" ;
sdo:name "*.ctm" .
a sdo:AudioObject ;
sdo:description "M4A file" ;
sdo:encodingFormat "audio/mpeg" ;
sdo:identifier "MP4AudioFormat" ;
sdo:name "*.m4a" .
a sdo:DigitalDocument ;
sdo:description "Automatic transcription of the input recording (full data) (AudioDoc XML)" ;
sdo:encodingFormat "text/xml" ;
sdo:identifier "XMLFormat" ;
sdo:name "*.xml" .
rdf:first ;
rdf:rest .
rdf:first "codemetapy validator using software.ttl" ;
rdf:rest () .
a sdo:SoftwareApplication ;
sdo:identifier "kaldi" ;
sdo:name "kaldi" .
rdf:first ;
rdf:rest () .
a sdo:Person ;
sdo:email "henk.vandenheuvel@ru.nl" ;
sdo:name "Emre Yilmaz, Maarten van Gompel" .
rdf:first ;
rdf:rest .
rdf:first ;
rdf:rest .
rdf:first ;
rdf:rest .
a sdo:AudioObject ;
sdo:description "Flac file" ;
sdo:encodingFormat "audio/flac" ;
sdo:identifier "FlacAudioFormat" ;
sdo:name "*.flac" .
a sdo:AudioObject ;
sdo:description "Ogg file" ;
sdo:encodingFormat "audio/vorbis" ;
sdo:identifier "OggAudioFormat" ;
sdo:name "*.ogg" .
a stype:WebApplication ;
sdo:name "Automatic Speech Recognition for Dutch" .
a sdo:DigitalDocument ;
sdo:description "Log file with (standard) error output" ;
sdo:encodingFormat "text/plain" ;
sdo:identifier "PlainTextFormat" ;
sdo:name "error.log" .
a sdo:Organization ;
sdo:name "Centre for Language and Speech Technology, Radboud University" .
a sdo:SoftwareApplication ;
sdo:identifier "kaldi_nl" ;
sdo:name "Kaldi_NL" .
a sdo:AudioObject ;
sdo:description "MP3 file" ;
sdo:encodingFormat "audio/mpeg" ;
sdo:identifier "MP3AudioFormat" ;
sdo:name "*.mp3" .
a sdo:Review ;
sdo:author ;
sdo:datePublished "2024-12-22 04:00:59"^^sdo:Date ;
sdo:name "Automatic software metadata validation report for Automatic Speech Recognition for Dutch 0.6.2" ;
sdo:reviewBody """Please consult the CLARIAH Software Metadata Requirements at https://github.com/CLARIAH/clariah-plus/blob/main/requirements/software-metadata-requirements.md for an in-depth explanation of any found problems
Validation of Automatic Speech Recognition for Dutch 0.6.2 was successful (score=3/5), but there are some warnings which should be addressed:
1. Warning: Software source code *SHOULD* link to a continuous integration service that builds the software and runs the software's tests (This is missing in the metadata)
2. Info: Software source code *MAY* express the programming language(s) used (This is missing in the metadata)
3. Info: An interface type *SHOULD* be expressed: Software source code should define one or more target products that are the resulting software applications offering specific interfaces (The metadata does express this currently, but something is wrong in the way it is expressed. Is the type/class valid?)
4. Warning: Documentation *SHOULD* be expressed (This is missing in the metadata)
5. Info: Reference publications *SHOULD* be expressed, if any (This is missing in the metadata)
6. Info: The funder *SHOULD* be acknowledged (This is missing in the metadata)""" ;
sdo:reviewRating 3 .
a sdo:WebApplication ;
sdo:author ;
sdo:description "This webservice uses automatic speech recognition to provide the transcriptions of recordings spoken in Dutch. You can upload and process only one file per project. For bulk processing and other questions, please contact Henk van den Heuvel at h.vandenheuvel@let.ru.nl." ;
sdo:name "Automatic Transcription of Dutch Speech Recordings" ;
sdo:provider ;
sdo:url ;
sdo:version "0.6.1" ;
iodata:consumesData ,
,
,
,
,
;
iodata:producesData ,
,
,
,
.
a skos:Concept ;
ns1:image "https://www.repostatus.org/badges/latest/active.svg" ;
skos:definition "The project has reached a stable, usable state and is being actively developed." ;
skos:inScheme "https://www.repostatus.org" ;
skos:prefLabel "Active" .
a sdo:Person ;
sdo:affiliation ;
sdo:email "emre.yilmaz@let.ru.nl" ;
sdo:familyName "Yılmaz" ;
sdo:givenName "Emre" .
a sdo:Person ;
sdo:affiliation ;
sdo:email "louis.tenbosch@ru.nl" ;
sdo:familyName "ten Bosch" ;
sdo:givenName "Louis" .
a sdo:Organization ;
sdo:location ;
sdo:name "Radboud University" ;
sdo:url .
a sdo:Organization ;
sdo:name "Centre for Language Studies" ;
sdo:parentOrganization ;
sdo:url .
a sdo:Person ;
sdo:affiliation ;
sdo:email "proycon@anaproy.nl" ;
sdo:familyName "van Gompel" ;
sdo:givenName "Maarten" .
skos:Concept a owl:Class .
a sdo:Organization ;
sdo:name "Centre for Language and Speech Technology" ;
sdo:parentOrganization ;
sdo:url .