Our data schema not only describes the actual links between publications and research data, but also models the process by which these links are obtained, i.e. the execution of algorithms through our services. A higher-level description of the schema is provided here.

 / schema / [text/turtle]

@base <http://infolis.gesis.org/infolink/schema/> .
@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
@prefix foaf: <http://xmlns.com/foaf/0.1/> .
@prefix dc: <http://purl.org/dc/elements/1.1/> .
@prefix owl: <http://www.w3.org/2002/07/owl#> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix skos: <http://www.w3.org/2004/02/skos/core#> .
@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
@prefix dcterms: <http://purl.org/dc/terms/> .
@prefix schema: <http://schema.org/> .
@prefix bibo: <http://purl.org/ontology/bibo/> .
@prefix infolis: <> .
@prefix dqm: <http://purl.org/dqm-vocabulary/v1/dqm#> .
@prefix omnom: <http://onto.dm2e.eu/schema/omnom/> .
@prefix doap: <http://usefulinc.com/ns/doap#> .
@prefix vann: <http://purl.org/vocab/vann/> .

# Metadata about the schema document itself (the empty IRI <> resolves against @base).
<>
    dc:description "This ontology is the normative source for the semantics and structure of the domain of the InFoLiS project" ;
    dc:title "Infolis Data model" ;
    # The XSD datatype name is case-sensitive (xsd:dateTime), and its lexical
    # form requires a colon in the timezone offset (+01:00, not +0100).
    dcterms:modified "2015-12-02T13:53:09+01:00"^^xsd:dateTime ;
    doap:implements <https://github.com/infolis/infoLink> ;
    a doap:Project ;
    rdfs:seeAlso <https://github.com/infolis>, <https://github.com/infolis/express-jsonld>, <https://github.com/infolis/infoLink>, <https://github.com/infolis/infolis-datasets>, <https://github.com/infolis/infolis-logging>, <https://github.com/infolis/infolis-web>, <https://github.com/infolis/jsonld-rapper>, <https://github.com/infolis/mongoose-jsonld>, <https://github.com/kba/jsonld-common-contexts>, <https://github.com/kba/node-vim2html>, <https://github.com/kba/turtleson> .

infolis:Entity
    dc:description "An entity to be linked from or to, i.e. a dataset or a publication" ;
    a owl:Class, owl:Thing .

infolis:EntityLink
    dc:description """An entity link describes that two entities are linked, i.e. a publication is linked to the research data that is mentioned in
the publication text""" ;
    a owl:Class, owl:Thing .

infolis:Execution
    dc:description "The concrete execution of an Algorithm." ;
    dcterms:source <https://github.com/infolis/infoLink/blob/master/src/main/java/io/github/infolis/model/Execution.java> ;
    vann:example <../api#!/rest-ld-execution> ;
    a owl:Class, owl:Thing ;
    rdfs:subClassOf schema:Action .

infolis:InfolisFile
    dc:description "A resource representing a file on the server." ;
    a owl:Class, owl:Thing ;
    owl:sameAs <http://onto.dm2e.eu/omnom/File> .

infolis:InfolisPattern
    dc:description "A Regular Expression pattern" ;
    a owl:Class, owl:Thing .

infolis:Keyword
    dc:description "Keywords indicate the topics of entities. They are generated by searching terms of a thesaurus in the abstract." ;
    a owl:Class, owl:Thing .

infolis:QueryService
    dc:description "A query service" ;
    a owl:Class, owl:Thing .

infolis:SearchQuery
    dc:description "A search query" ;
    vann:example <../api#!/rest-ld-searchQuery> ;
    a owl:Class, owl:Thing .

infolis:SearchResult
    dc:description "A search result" ;
    a owl:Class, owl:Thing ;
    rdfs:subClassOf infolis:Entity .

infolis:TextualReference
    dc:description "Class for saving contexts (= surrounding words of a term)." ;
    a owl:Class, owl:Thing .

infolis:abstractLanguage
    dc:description "Language of the abstracts" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("en"
            "de"
        )
    ] .

infolis:abstractText
    dc:description "The description of an entity which has been expressed in an abstract" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs dc:abstract .

# Property of an Execution naming the algorithm class to run.
# The range is an enumerated datatype (owl:oneOf) of fully qualified class names.
# TODO fix this for updated version
# (This note used to be a string member of the enumeration below, which made
# it look like a permitted algorithm value.)
infolis:algorithm
    dc:description "Java class of the algorithm which is supposed to be executed within this execution." ;
    dcterms:source <https://github.com/infolis/infoLink/blob/master/src/main/java/io/github/infolis/model/Execution.java> ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("io.github.infolis.algorithm.BestMatchLinker"
            "io.github.infolis.algorithm.BibliographyExtractor"
            "io.github.infolis.algorithm.DoiExtractor"
            "io.github.infolis.algorithm.DoiLinker"
            "io.github.infolis.algorithm.FederatedSearcher"
            "io.github.infolis.algorithm.FrequencyBasedBootstrapping"
            "io.github.infolis.algorithm.GoldLinker"
            "io.github.infolis.algorithm.Indexer"
            "io.github.infolis.algorithm.InfolisPatternSearcher"
            "io.github.infolis.algorithm.KeywordTagger"
            "io.github.infolis.algorithm.LearnPatternsAndCreateLinks"
            "io.github.infolis.algorithm.Learner"
            "io.github.infolis.algorithm.LinkImporter"
            "io.github.infolis.algorithm.LocalSearcher"
            "io.github.infolis.algorithm.LuceneSearcher"
            "io.github.infolis.algorithm.MetaDataExtractor"
            "io.github.infolis.algorithm.MultiMatchesLinker"
            "io.github.infolis.algorithm.OntologyLinker"
            "io.github.infolis.algorithm.ReferenceLinker"
            "io.github.infolis.algorithm.RegexSearcher"
            "io.github.infolis.algorithm.ReliabilityBasedBootstrapping"
            "io.github.infolis.algorithm.SearchPatternsAndCreateLinks"
            "io.github.infolis.algorithm.SearchDoisAndCreateLinks"
            "io.github.infolis.algorithm.SearchResultLinker"
            "io.github.infolis.algorithm.SpringerImporter"
            "io.github.infolis.algorithm.TagSearcher"
            "io.github.infolis.algorithm.TextAndMetaDataExtractor"
            "io.github.infolis.algorithm.TextExtractor"
            "io.github.infolis.algorithm.NameExtractor"
            "io.github.infolis.algorithm.Tokenizer"
            "io.github.infolis.algorithm.TokenizerOpenNLP"
            "io.github.infolis.algorithm.TokenizerStanford"
            "org.gesis.git.LODInfrastructure.dataProcessing.importer.AllbusBibImporter"
            "org.gesis.git.LODInfrastructure.dataProcessing.importer.DbkImporter"
            "org.gesis.git.LODInfrastructure.dataProcessing.importer.ZisImporter"
            "org.gesis.git.LODInfrastructure.dataProcessing.enrichment.DatasetSearcher"
        )
    ] .

infolis:allowLeadingWildcards
    dc:description """Determines whether the Lucene query parser is allowed to
use leading wildcard characters.
Default: true""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:authors
    dc:description "List of authors who created the entity" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs dc:creator .

infolis:bootstrapStrategy
    dc:description "Strategy to use for bootstrapping. Can either be: mergeCurrent, mergeNew, mergeAll, separate, reliability." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("mergeCurrent"
            "mergeNew"
            "mergeAll"
            "separate"
            "reliability"
        )
    ] .

# Confidence attached to an EntityLink.
# NOTE(review): the description previously named xsd:double while the declared
# range is xsd:float; the description is aligned to the range here. Confirm
# whether the range should be widened to xsd:double instead.
infolis:confidence
    dc:description "Describes how likely it is that the link indeed holds, xsd:float" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range xsd:float .

# Confidence score attached to a Keyword.
infolis:confidenceScore
    dc:description "The confidence score of a keyword is based on the similarity of the terms in the abstract to the terms in the thesaurus." ;
    schema:domainIncludes infolis:Keyword ;
    rdfs:range xsd:float .

# Date of a SearchResult, stored as a plain string.
infolis:date
    dc:description "Date of the search result" ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:string .

# End timestamp of an Execution.
# The term is a property, so it is typed rdf:Property; typing it as an
# instance of an XSD datatype (formerly `a xsd:date`) is not meaningful and
# also disagreed with the xsd:dateTime range.
infolis:endTime
    dc:description "Timestamp when execution ended." ;
    schema:domainIncludes infolis:Execution ;
    a rdf:Property ;
    rdfs:range xsd:dateTime ;
    owl:sameAs schema:endTime .

infolis:entitiesForKeywordTagging
    dc:description """List of entities (URIs of the entities) for which key words should be
generated. Serves as input for the keyword  tagging algorithm.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:Entity .

infolis:entityRelations
    dc:description "Type of the relation that holds between fromEntity and toEntity" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("part_of_temporal"
            "part_of_spatial"
            "superset_of_temporal"
            "superset_of_spatial"
            "parts_of_temporal"
            "parts_of_spatial"
            "version_of"
            "superset_of_version"
            "part_of_confidential"
            "superset_of_confidential"
            "part_of_sample"
            "superset_of_sample"
            "part_of_supplement"
            "superset_of_supplement"
            "part_of"
            "parts_of"
            "superset_of"
            "same_as_temporal"
            "same_as_spatial"
            "superset_of_translation"
            "part_of_translation"
            "part_of_methodical"
            "parts_of_methodical"
            "superset_of_methodical"
            "unknown"
            "same_as"
            "references"
        )
    ] ;
    owl:sameAs dc:relation .

infolis:entityReliability
    dc:description "Confidence value for this entity; less than 1 for automatically generated entities" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:float .

infolis:entityType
    dc:description "The type of entity: publication, dataset, database, citedData, project, institution or instrument" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("publication"
            "dataset"
            "database"
            "citedData"
            "project"
            "institution"
            "instrument"
        )
    ] .

infolis:entityView
    dc:description "View to display for this entity (e.g. a citation string)" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string .

# Base name of an InfolisFile.
infolis:fileName
    dc:description "The name of a file in the sense of what `basename(1)` would return." ;
    schema:domainIncludes infolis:InfolisFile ;
    rdfs:range xsd:string ;
    owl:sameAs <http://onto.dm2e.eu/omnom/fileName> .

infolis:fileStatus
    dc:description "The status of the bytestream of a file on the server, indicating whether it is still there or has been deleted" ;
    schema:domainIncludes infolis:InfolisFile ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("AVAILABLE"
            "DELETED"
        )
    ] ;
    owl:sameAs <http://onto.dm2e.eu/omnom/fileStatus> .

infolis:fromEntity
    dc:description "The entity from which the link originates from, this is typically the publication" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range infolis:Entity .

infolis:identifier
    dc:description "Identifiers of the search result" ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:string .

infolis:identifiers
    dc:description "Identifiers of the entity" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string .

infolis:indexDirectory
    dc:description "index directory of the indexer." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:infolisFileTags
    dc:description "List of tags to identify a specific set of InfolisFiles" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:infolisPatternTags
    dc:description "List of tags to identify a specific set of InfolisPatterns" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:inputFiles
    dc:description """List of URIs of input files.
Can be either PDF or text files.
They are for example used to search patterns within the Pattern Applier algorithm.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:InfolisFile .

infolis:keyWords
    dc:description "Key words which are generated by the KeywordTagger." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:language
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs dc:language .

infolis:leftContextGroup
    dc:description "Group numbers to use for RegexSearcher: group of left context." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:leftText
    dc:description "Text left of the term" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range xsd:string .

infolis:linkReason
    dc:description """The TextualReference found in the fromEntity based on which a 
link to the toEntity was established""" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range xsd:string .

infolis:linkView
    dc:description "View to display for this link" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range xsd:string .

infolis:linkedEntities
    dc:description """Beside the search in external repositories, we can also
search in our own database. As use case, we get a URN for a publication
from a user and want to show all named entities that are linked to 
this publication. With an internal search using the generated links,
we can find these entities which are returned in this list.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:Entity .

infolis:links
    dc:description """As a final step, links between the texts and the discovered
named entities (research data) are established and saved in this list.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:EntityLink .

infolis:listIndex
    dc:description "Position in the list of search results" ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:float .

infolis:log
    dc:description "Log messages of this execution." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:luceneQuery
    dc:description "The Lucene query that can be used to query an index" ;
    schema:domainIncludes infolis:InfolisPattern ;
    rdfs:range xsd:string .

infolis:manifestsEntity
    dc:description "The Entity this Infolisfile manifests" ;
    schema:domainIncludes infolis:InfolisFile ;
    rdfs:range infolis:Entity .

# Execution parameter: upper bound on the clauses of a Lucene BooleanQuery.
infolis:maxClauseCount
    dc:description """The maximum number of clauses permitted per BooleanQuery (Lucene search).
A boolean query represents a query that matches documents
matching boolean combinations of other queries.
Default: Integer max value""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

# Execution parameter: iteration cap for bootstrapping.
infolis:maxIterations
    dc:description """Maximum number of iterations during the bootstrapping process.
A high number of iterations can lead to an increased run time.
Default: 10""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:maxNumber
    dc:description "Maximum number of results" ;
    schema:domainIncludes infolis:QueryService ;
    rdfs:range xsd:float .

# MD5 checksum of an InfolisFile.
# The term is a property, so it is typed rdf:Property; typing it as an
# instance of the xsd:string datatype (formerly `a xsd:string`) is not
# meaningful. The value type is already expressed by rdfs:range.
infolis:md5
    dc:description "MD5 checksum" ;
    schema:domainIncludes infolis:InfolisFile ;
    a rdf:Property ;
    rdfs:range xsd:string ;
    owl:sameAs <http://onto.dm2e.eu/omnom/md5> .

infolis:mediaType
    dc:description "The IANA media type of this file" ;
    schema:domainIncludes infolis:InfolisFile ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("application/pdf"
            "text/plain"
        )
    ] ;
    owl:sameAs <http://www.w3.org/ns/dcat#mediaType> .

infolis:mentionsReference
    dc:description "Entity that contains this textual reference" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range infolis:Entity .

# Execution parameter: metadata files belonging to the publications.
infolis:metaDataFiles
    dc:description """Meta data files of the publications in which information about
the title, author, abstract, subject, identifiers, URL, and language
can be found.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:name
    dc:description "Name of the entity" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string .

infolis:numericInfo
    dc:description "Numeric information belonging to the entity, e.g. temporal coverage or publication date" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string .

infolis:numericInformation
    dc:description "Any kind of numeric information that we can extract from a search result, e.g. years, versions etc." ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:string .

infolis:outputDirectory
    dc:description "Output directory of the indexer." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:outputFiles
    dc:description "List of URIs of output files. Output files to save the output files (txt files) of algorithms." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:InfolisFile .

infolis:overwriteTextFiles
    dc:description """Flag used by TextExtractor: if set to false, pdfs for which corresponding text 
files already exist in the specified text directory will not be converted again, instead 
the existing text files will be returned as InfolisFile instances. If set to true, all 
pdfs will be converted regardless of any existing files in the text directory. """ ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:pattern
    dc:description "Pattern that extracted this textual reference" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range infolis:InfolisPattern .

infolis:patternRegex
    dc:description "A string containing a Java Regular Expression pattern" ;
    schema:domainIncludes infolis:InfolisPattern ;
    rdfs:range xsd:string ;
    owl:sameAs dqm:regex .

infolis:patternReliability
    dc:description "Confidence value for this pattern; less than 1 for automatically generated patterns" ;
    schema:domainIncludes infolis:InfolisPattern ;
    rdfs:range xsd:float .

# Execution parameter: the patterns to apply to texts.
# The range is infolis:InfolisPattern, matching the description; it was
# previously infolis:InfolisFile, which is the range of the inputFiles and
# outputFiles properties and looks like a copy-paste error.
infolis:patterns
    dc:description """A list of patterns (internally expressed as regular expression)
that can be applied on texts, e.g. to find links to research data.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:InfolisPattern .

infolis:phraseSlop
    dc:description """The slop for phrases used by the Lucene query parser.
It determines how similar two phrases must be to be matched.
If zero, then only exact phrase matches, if 10 up to 10 edit
operations may be carried out.
Default: 10""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:progress
    dc:description "Numerical progress of the execution in the interval 0-100." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:provenance
    dc:description "Source of the link" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range xsd:string .

infolis:ptb3Escaping
    dc:description "Enable all traditional PTB3 token transforms (like parentheses becoming -LRB-, -RRB-)." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:query
    dc:description "The query string" ;
    schema:domainIncludes infolis:SearchQuery ;
    rdfs:range xsd:string .

infolis:queryService
    dc:description "Query Service used to retrieve search result." ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:string .

# Execution parameter: QueryService implementations named by Java class,
# as an alternative to infolis:queryServices. The range is an enumerated datatype.
infolis:queryServiceClasses
    dc:description "Instead of using a list of QueryService URIs (queryServices), the Java classes of the QueryServices can be used. This way, the query services do not need to be posted." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("io.github.infolis.infolink.querying.DaraHTMLQueryService"
            "io.github.infolis.infolink.querying.DaraSolrQueryService"
            "io.github.infolis.infolink.querying.DataciteQueryService"
        )
    ] .

infolis:queryServiceType
    dc:description "Service for searching entities in a repository." ;
    schema:domainIncludes infolis:QueryService ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("io.github.infolis.infolink.querying.DaraHTMLQueryService"
            "io.github.infolis.infolink.querying.DaraSolrQueryService"
            "io.github.infolis.infolink.querying.DataciteQueryService"
        )
    ] .

infolis:queryServices
    dc:description "List of QueryService to use. A query service to a certain repository can be posted and later referred." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:QueryService .

infolis:queryStrategy
    dc:description "Fields that can be used in a query." ;
    schema:domainIncludes infolis:QueryService ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("title"
            "publicationDate"
            "numericInfoInTitle"
            "doi"
        )
    ] .

infolis:reference
    dc:description "The term" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range xsd:string .

infolis:referenceGroup
    dc:description """Group numbers to use for RegexSearcher: group of reference term.
number of the group which contains the doi. This number depends on the used doiRegex""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:referenceReliability
    dc:description "Confidence value for this textual reference; less than 1 for automatically generated references" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range xsd:float .

infolis:referredEntity
    dc:description "Refers to the entity to which the keyword has been assigned." ;
    schema:domainIncludes infolis:Keyword ;
    rdfs:range infolis:Entity .

infolis:relevanceScore
    dc:description "Relevance score as calculated by the search engine" ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:float .

infolis:reliabilityThreshold
    dc:description "Determines which patterns are the relevant ones." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:removeBib
    dc:description "Whether to remove the bibliography from text/plain document." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:rightContextGroup
    dc:description "Group numbers to use for RegexSearcher: group of right context." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

infolis:rightText
    dc:description "Text right of the term" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range xsd:string .

# Execution parameter: links an Execution to a SearchQuery resource.
infolis:searchQuery
    dc:description """Any kind of search query that can be used within the algorithms.
For example, it represents the search query which is used
to perform a search in different repositories to find
fitting research data.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:SearchQuery .

infolis:searchResultLinkerClass
    dc:description """The SearchResultLinkerClass determines the SearchResultLinker to 
use. That class is responsible for deciding which SearchResults to 
select for creating links.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("io.github.infolis.algorithm.BestMatchLinker"
            "io.github.infolis.algorithm.MultiMatchesLinker"
            "io.github.infolis.algorithm.OntologyLinker"
            "io.github.infolis.algorithm.GoldLinker"
        )
    ] .

infolis:searchResults
    dc:description """After a search in one or more repositories, a list 
of search results is returned. These results not only contain
the repository which was searched but also information like
the relevance score.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range infolis:SearchResult .

# Execution parameter: a single term to search for, e.g. a bootstrapping seed.
infolis:searchTerm
    dc:description """A search term that can be used in different algorithms whenever
a certain term needs to be searched in a text.
For example, the bootstrapping algorithms need a seed in the beginning to start
the whole process. The search term represents such a seed, e.g. the study name 'ALLBUS'.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:seeds
    dc:description "The initial seeds for learning." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:serviceReliability
    dc:description "The reliability of this QueryService" ;
    schema:domainIncludes infolis:QueryService ;
    rdfs:range xsd:float .

infolis:spatial
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs dcterms:spatial .

infolis:startPage
    dc:description """Index (starting at 1 rather than 0) of the first page to extract. 
Useful to ignore title pages if present.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

# Start timestamp of an Execution.
# The term is a property, so it is typed rdf:Property; typing it as an
# instance of an XSD datatype (formerly `a xsd:date`) is not meaningful and
# also disagreed with the xsd:dateTime range.
infolis:startTime
    dc:description "Timestamp when execution started." ;
    schema:domainIncludes infolis:Execution ;
    a rdf:Property ;
    rdfs:range xsd:dateTime ;
    owl:sameAs schema:startTime .

# Lifecycle status of an Execution; the range is an enumerated datatype.
infolis:status
    dc:description """Status of the execution

* PENDING
* STARTED
* FINISHED
* FAILED

Default (when starting): ExecutionStatus.PENDING""" ;
    # The example must be one of the enumerated values below; "SUCCESS" is not.
    vann:example "FINISHED" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range [
        a rdfs:Datatype ;
        owl:oneOf ("PENDING"
            "STARTED"
            "FAILED"
            "FINISHED"
        )
    ] .

infolis:subjects
    dc:description "List of subjects which are assigned to an entity, this can either be free text keywords or keywords from a controlled vocabulary" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs dc:subject .

infolis:tags
    dc:description "A set of free form tags attached to this file", """Free-form tags to assign to the execution and all generated entities. 
This makes all uploaded and generated data identifiable and searchable 
e.g. using infolisFileTags, infolisPatternTags and textualReferenceTags. """, "Tags assigned to this entity", "Tags assigned to this entityLink", "Tags assigned to this keyword", "Tags assigned to this pattern", "Tags assigned to this query service", "Tags assigned to this search result", "Tags assigned to this textual reference" ;
    schema:domainIncludes infolis:Entity, infolis:EntityLink, infolis:Execution, infolis:InfolisFile, infolis:InfolisPattern, infolis:Keyword, infolis:QueryService, infolis:SearchResult, infolis:TextualReference ;
    rdfs:range xsd:string ;
    owl:sameAs dc:subject .

infolis:target
    dc:description "The target of this QueryService, in most cases a URI" ;
    schema:domainIncludes infolis:QueryService ;
    rdfs:range xsd:anyURI .

infolis:textFile
    dc:description "The file this reference came from" ;
    schema:domainIncludes infolis:TextualReference ;
    rdfs:range infolis:InfolisFile .

infolis:textualReferenceTags
    dc:description "List of tags to identify a specific set of TextualReferences" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

# Links an Entity or an Execution to TextualReference resources.
# TODO remove
# NOTE(review): the TODO above was previously published as a second
# dc:description value ("TODO remove"). Presumably it applies to only one of
# the two domains listed below -- confirm which before removing anything.
infolis:textualReferences
    dc:description """A textual reference represents any kind of reference that
can be found in a text, e.g. a term like a study name has been found in a publication.
Besides the text and the term that has been found in the text,
it also contains the context, i.e. where the term has been detected.""" ;
    schema:domainIncludes infolis:Entity, infolis:Execution ;
    rdfs:range infolis:TextualReference .

infolis:thesaurus
    dc:description "Path/URI to the thesaurus which is used for the key word tagging." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:string .

infolis:thesaurusLabel
    dc:description "Label of the keyword in the thesaurus." ;
    schema:domainIncludes infolis:Keyword ;
    rdfs:range xsd:string .

infolis:thesaurusURI
    dc:description "URI of the keyword in the thesaurus." ;
    schema:domainIncludes infolis:Keyword ;
    rdfs:range xsd:string .

infolis:threshold
    dc:description "Threshold which is applied to only filter relevant patterns" ;
    schema:domainIncludes infolis:InfolisPattern ;
    rdfs:range xsd:float .

# Titles collected for a SearchResult.
infolis:titles
    dc:description "All titles that have been found as names, can also be from different languages" ;
    schema:domainIncludes infolis:SearchResult ;
    rdfs:range xsd:string .

infolis:toEntity
    dc:description "The entity to which is linked, this is typically the research data" ;
    schema:domainIncludes infolis:EntityLink ;
    rdfs:range infolis:Entity .

infolis:tokenize
    dc:description """Whether to tokenize text input.

Bootstrapping requires tokenized input texts to perform well. It can
either be called on tokenized input texts or it can be called on
untokenized text or pdf files and perform tokenization itself. If
unspecified, defaults to false for TextExtractor. For Bootstrapping,
this field has to be set explicitly as this information is crucial for
good performance.""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:tokenizeNLs
    dc:description "Determines whether new line characters are to be tokenized." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:upperCaseConstraint
    dc:description """Indicates whether we require a term to contain at least one upper case
character.

The idea behind is that especially a study name is supposed to be a
named entity and thus should contain at least one upper-case character.
Default: false""" ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:boolean .

infolis:url
    dc:description "URL describing the entity or offering supplemental material" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string .

infolis:versionInfo
    dc:description "Version of a datafile" ;
    schema:domainIncludes infolis:Entity ;
    rdfs:range xsd:string ;
    owl:sameAs owl:versionInfo .

infolis:windowsize
    dc:description "Number of words used for creation of patterns." ;
    schema:domainIncludes infolis:Execution ;
    rdfs:range xsd:float .

<https://github.com/infolis>
    doap:shortdesc "Github organization containing all the software developed by InFoLiS" ;
    a doap:Project .

<https://github.com/infolis/express-jsonld>
    dcterms:requires <https://github.com/infolis/infolis-logging>, <https://github.com/infolis/jsonld-rapper> ;
    doap:programming-language "CoffeeScript" ;
    doap:shortdesc "JSON-LD content-negotiating middleware for Express based on node-jsonld and rapper" ;
    a doap:Project .

<https://github.com/infolis/infoLink>
    doap:programming-language "Java" ;
    doap:shortdesc "The software implementing all the algorithms, doing the text mining, linking the entities and much more" ;
    a doap:Project .

<https://github.com/infolis/infolis-datasets>
    doap:programming-language "Python" ;
    doap:shortdesc "Project containing all the data and tools to run learning and linking in bulk in a Linux environment." ;
    a doap:Project .

<https://github.com/infolis/infolis-logging>
    doap:programming-language "JavaScript" ;
    doap:shortdesc "Module-specific Winston logging" ;
    a doap:Project .

# DOAP description of the infolis-web project; it implements this schema (<>).
<https://github.com/infolis/infolis-web>
    dcterms:requires <https://github.com/infolis/express-jsonld>, <https://github.com/infolis/infolis-logging>, <https://github.com/infolis/mongoose-jsonld>, <https://github.com/kba/node-vim2html>, <https://github.com/kba/turtleson> ;
    doap:implements <> ;
    # Spelled "JavaScript" to match the other project descriptions in this file.
    doap:programming-language "JavaScript" ;
    doap:shortdesc "Project that implements the HTTP-based RESTful Linked Data infrastructure for InFoLiS" ;
    a doap:Project .

<https://github.com/infolis/jsonld-rapper>
    dcterms:requires <https://github.com/infolis/infolis-logging>, <https://github.com/kba/jsonld-common-contexts> ;
    doap:programming-language "CoffeeScript" ;
    doap:shortdesc "Convert between RDF and JSON-LD using rapper" ;
    a doap:Project .

<https://github.com/infolis/mongoose-jsonld>
    dcterms:requires <https://github.com/infolis/express-jsonld>, <https://github.com/infolis/infolis-logging>, <https://github.com/infolis/jsonld-rapper>, <https://github.com/kba/jsonld-common-contexts>, <https://github.com/kba/turtleson> ;
    doap:programming-language "CoffeeScript" ;
    doap:shortdesc "Add JSON-LD context to a Mongoose schema" ;
    a doap:Project .

<https://github.com/kba/jsonld-common-contexts>
    doap:programming-language "JavaScript" ;
    doap:shortdesc "Cached versions of commonly used namespaces" ;
    a doap:Project .

<https://github.com/kba/node-vim2html>
    doap:programming-language "Makefile" ;
    doap:shortdesc "Create HTML highlighted by Vim`s 2html script" ;
    a doap:Project .

<https://github.com/kba/turtleson>
    doap:programming-language "JavaScript" ;
    doap:shortdesc "Concise, permissive, TURTLE-like dialect of JSON" ;
    a doap:Project .