Files
marka/registry/schema-org/StatisticalVariable.schema.json
Max Richter c687eff53d big tings
2025-08-17 15:16:17 +02:00

111 lines
7.3 KiB
JSON

{
"$schema": "https://json-schema.org/draft/2020-12/schema",
"$id": "schema:StatisticalVariable",
"title": "StatisticalVariable",
"description": "[[StatisticalVariable]] represents any type of statistical metric that can be measured at a place and time. The usage pattern for [[StatisticalVariable]] is typically expressed using [[Observation]] with an explicit [[populationType]], which is a type, typically drawn from Schema.org. Each [[StatisticalVariable]] is marked as a [[ConstraintNode]], meaning that some properties (those listed using [[constraintProperty]]) serve in this setting solely to define the statistical variable rather than literally describe a specific person, place or thing. For example, a [[StatisticalVariable]] Median_Height_Person_Female representing the median height of women, could be written as follows: the population type is [[Person]]; the measuredProperty [[height]]; the [[statType]] [[median]]; the [[gender]] [[Female]]. It is important to note that there are many kinds of scientific quantitative observation which are not fully, perfectly or unambiguously described following this pattern, or with solely Schema.org terminology. The approach taken here is designed to allow partial, incremental or minimal description of [[StatisticalVariable]]s, and the use of detailed sets of entity and property IDs from external repositories. The [[measurementMethod]], [[unitCode]] and [[unitText]] properties can also be used to clarify the specific nature and notation of an observed measurement. ",
"type": "object",
"allOf": [
{
"description": "The ConstraintNode type is provided to support usecases in which a node in a structured data graph is described with properties which appear to describe a single entity, but are being used in a situation where they serve a more abstract purpose. A [[ConstraintNode]] can be described using [[constraintProperty]] and [[numConstraints]]. These constraint properties can serve a\n variety of purposes, and their values may sometimes be understood to indicate sets of possible values rather than single, exact and specific values.",
"$ref": "schema:ConstraintNode"
}
],
"properties": {
"measuredProperty": {
"description": "The measuredProperty of an [[Observation]], typically via its [[StatisticalVariable]]. There are various kinds of applicable [[Property]]: a schema.org property, a property from other RDF-compatible systems, e.g. W3C RDF Data Cube, Data Commons, Wikidata, or schema.org extensions such as [GS1's](https://www.gs1.org/voc/?show=properties).",
"$ref": "schema:Property"
},
"measurementDenominator": {
"description": "Identifies the denominator variable when an observation represents a ratio or percentage.",
"oneOf": [
{ "$ref": "schema:StatisticalVariable" },
{ "type": "array", "items": { "$ref": "schema:StatisticalVariable" } }
]
},
"measurementMethod": {
"description": "A subproperty of [[measurementTechnique]] that can be used for specifying specific methods, in particular via [[MeasurementMethodEnum]].",
"oneOf": [
{
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:DefinedTerm" },
{ "$ref": "schema:MeasurementMethodEnum" }
]
},
{
"type": "array",
"items": {
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:DefinedTerm" },
{ "$ref": "schema:MeasurementMethodEnum" }
]
}
}
]
},
"measurementQualifier": {
"description": "Provides additional qualification to an observation. For example, a GDP observation measures the Nominal value.",
"oneOf": [
{ "$ref": "schema:Enumeration" },
{ "type": "array", "items": { "$ref": "schema:Enumeration" } }
]
},
"measurementTechnique": {
"description": "A technique, method or technology used in an [[Observation]], [[StatisticalVariable]] or [[Dataset]] (or [[DataDownload]], [[DataCatalog]]), corresponding to the method used for measuring the corresponding variable(s) (for datasets, described using [[variableMeasured]]; for [[Observation]], a [[StatisticalVariable]]). Often but not necessarily each [[variableMeasured]] will have an explicit representation as (or mapping to) an property such as those defined in Schema.org, or other RDF vocabularies and \"knowledge graphs\". In that case the subproperty of [[variableMeasured]] called [[measuredProperty]] is applicable.\n \nThe [[measurementTechnique]] property helps when extra clarification is needed about how a [[measuredProperty]] was measured. This is oriented towards scientific and scholarly dataset publication but may have broader applicability; it is not intended as a full representation of measurement, but can often serve as a high level summary for dataset discovery. \n\nFor example, if [[variableMeasured]] is: molecule concentration, [[measurementTechnique]] could be: \"mass spectrometry\" or \"nmr spectroscopy\" or \"colorimetry\" or \"immunofluorescence\". If the [[variableMeasured]] is \"depression rating\", the [[measurementTechnique]] could be \"Zung Scale\" or \"HAM-D\" or \"Beck Depression Inventory\". \n\nIf there are several [[variableMeasured]] properties recorded for some given data object, use a [[PropertyValue]] for each [[variableMeasured]] and attach the corresponding [[measurementTechnique]]. The value can also be from an enumeration, organized as a [[MeasurementMetholdEnumeration]].",
"oneOf": [
{
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:DefinedTerm" },
{ "$ref": "schema:MeasurementMethodEnum" }
]
},
{
"type": "array",
"items": {
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:DefinedTerm" },
{ "$ref": "schema:MeasurementMethodEnum" }
]
}
}
]
},
"populationType": {
"description": "Indicates the populationType common to all members of a [[StatisticalPopulation]] or all cases within the scope of a [[StatisticalVariable]].",
"oneOf": [
{ "$ref": "schema:Class" },
{ "type": "array", "items": { "$ref": "schema:Class" } }
]
},
"statType": {
"description": "Indicates the kind of statistic represented by a [[StatisticalVariable]], e.g. mean, count etc. The value of statType is a property, either from within Schema.org (e.g. [[median]], [[marginOfError]], [[maxValue]], [[minValue]]) or from other compatible (e.g. RDF) systems such as DataCommons.org or Wikidata.org. ",
"oneOf": [
{
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:Property" }
]
},
{
"type": "array",
"items": {
"anyOf": [
{ "type": "string", "format": "uri" },
{ "type": "string" },
{ "$ref": "schema:Property" }
]
}
}
]
}
}
}