Source code for dapla_metadata.variable_definitions.vardef

import logging
from datetime import date
from os import PathLike
from pathlib import Path

from dapla_metadata.variable_definitions._generated.vardef_client.api.data_migration_api import (
    DataMigrationApi,
)
from dapla_metadata.variable_definitions._generated.vardef_client.api.draft_variable_definitions_api import (
    DraftVariableDefinitionsApi,
)
from dapla_metadata.variable_definitions._generated.vardef_client.api.variable_definitions_api import (
    VariableDefinitionsApi,
)
from dapla_metadata.variable_definitions._generated.vardef_client.models.complete_response import (
    CompleteResponse,
)
from dapla_metadata.variable_definitions._generated.vardef_client.models.draft import (
    Draft,
)
from dapla_metadata.variable_definitions._generated.vardef_client.models.vardok_id_response import (
    VardokIdResponse,
)
from dapla_metadata.variable_definitions._utils._client import VardefClient
from dapla_metadata.variable_definitions._utils.template_files import (
    _find_latest_template_file,
)
from dapla_metadata.variable_definitions._utils.template_files import (
    create_template_yaml,
)
from dapla_metadata.variable_definitions._utils.variable_definition_files import (
    _read_file_to_model,
)
from dapla_metadata.variable_definitions.exceptions import VariableNotFoundError
from dapla_metadata.variable_definitions.exceptions import vardef_exception_handler
from dapla_metadata.variable_definitions.exceptions import vardef_file_error_handler
from dapla_metadata.variable_definitions.vardok_id import VardokId
from dapla_metadata.variable_definitions.vardok_vardef_id_pair import VardokVardefIdPair
from dapla_metadata.variable_definitions.variable_definition import VariableDefinition

logger = logging.getLogger(__name__)


[docs] class Vardef: """Create, maintain and read Variable Definitions. ==================== Variable Definitions ==================== Variable Definitions are centralized definitions of concrete variables which are typically present in multiple datasets. Variable Definitions support standardization of data and metadata and facilitate sharing and joining of data by clarifying when variables have an identical definition. The methods in this class allow for creation, maintenance and access of Variable Definitions. Creation and maintenance of variables may only be performed by Statistics Norway employees representing a specific Dapla team, who are defined as the owners of a given Variable Definition. The group a user represents is chosen when starting a service in Dapla Lab. This class will seamlessly detect this and send it to the API. All maintenance is to be performed by the owners, with no intervention from administrators. ====== Status ====== All Variable Definitions have an associated status. The possible values for status are `DRAFT`, `PUBLISHED_INTERNAL` and `PUBLISHED_EXTERNAL`. ----- Draft ----- When a Variable Definition is created it is assigned the status `DRAFT`. Under this status the Variable Definition is: * Only visible to Statistics Norway employees. * Mutable (it may be changed directly without need for versioning). * Not suitable to refer to from other systems. This status may be changed to `PUBLISHED_INTERNAL` or `PUBLISHED_EXTERNAL` with a direct update. ------------------ Published Internal ------------------ Under this status the Variable Definition is: * Only visible to Statistics Norway employees. * Immutable (all changes are versioned). * Suitable to refer to in internal systems for statistics production. * Not suitable to refer to for external use (for example in Statistikkbanken). This status may be changed to `PUBLISHED_EXTERNAL` by creating a Patch version. ------------------ Published External ------------------ Under this status the Variable Definition is: * Visible to the general public. * Immutable (all changes are versioned). * Suitable to refer to from any system. This status may not be changed as it would break immutability. If a Variable Definition is no longer relevant then its period of validity should be ended by specifying a `valid_until` date in a Patch version. ============ Immutability ============ Variable Definitions are immutable. This means that any changes must be performed in a strict versioning system. Consumers can avoid being exposed to breaking changes by specifying a `date_of_validity` when they request a Variable Definition. """
[docs] @classmethod @vardef_exception_handler def create_draft(cls, draft: Draft) -> VariableDefinition: """Create a Draft Variable Definition.""" new_variable = VariableDefinition.from_model( DraftVariableDefinitionsApi( VardefClient.get_client(), ).create_variable_definition( draft=draft, ), ) logger.info( "✅ Successfully created variable definition '%s' with ID '%s'", new_variable.short_name, new_variable.id, ) return new_variable
[docs] @classmethod @vardef_file_error_handler def create_draft_from_file( cls, file_path: PathLike[str] | None = None, ) -> VariableDefinition: """Create a Draft Variable Definition from a stored yaml file. By default the latest template file in the default directory is chosen, this may be overridden by providing a value for the optional `file_path` parameter. Args: file_path (PathLike[str], optional): Supply a file path to override the automatic one. Defaults to None. Raises: FileNotFoundError: When a file can't be found. Returns: VariableDefinition: The created draft variable definition. """ return cls.create_draft( _read_file_to_model( file_path or _find_latest_template_file(), Draft, ), )
[docs] @classmethod @vardef_exception_handler def migrate_from_vardok(cls, vardok_id: str) -> VariableDefinition: """Migrate a Variable Definition from Vardok to Vardef. - Each Vardok Variable Definition may only be migrated once. - The Dapla team of the person who performs the migration will be set as the owner. - All metadata should be checked for correctness before publication. Args: vardok_id (str): The ID of a Variable Definition in Vardok. Returns: VariableDefinition: The migrated Variable Definition in Vardef. """ migrated_variable = VariableDefinition.from_model( DataMigrationApi( VardefClient.get_client(), ).create_variable_definition_from_var_dok( vardok_id=vardok_id, ), ) logger.info( "✅ Successfully migrated variable definition '%s' with ID '%s'", migrated_variable.short_name, migrated_variable.id, ) return migrated_variable
[docs] @classmethod @vardef_exception_handler def list_vardok_vardef_mapping(cls) -> list[VardokVardefIdPair]: """List the mapping between vardok and vardef. Returns: List[VardokVardefIdPair]: The list with mappings between Vardok and Vardef """ return [ VardokVardefIdPair.from_model(definition) for definition in DataMigrationApi( VardefClient.get_client(), ).get_vardok_vardef_mapping() ]
[docs] @classmethod @vardef_exception_handler def get_variable_definition_by_vardok_id( cls, vardok_id: str, ) -> VariableDefinition: """Get a Variable Definition by its Vardok ID. Args: vardok_id (str): The Vardok ID of the desired Variable Definition Returns: VariableDefinition: The Variable Definition. Raises: TypeError: If the incorrect type is returned. """ raw_response = DataMigrationApi( VardefClient.get_client() ).get_vardok_vardef_mapping_by_id( vardok_id, ) if isinstance(raw_response.actual_instance, CompleteResponse): return VariableDefinition.from_model(raw_response.actual_instance) msg = "Unexpected response type" raise TypeError(msg)
[docs] @classmethod @vardef_exception_handler def get_vardok_id_by_short_name( cls, short_name: str, ) -> VardokId: """Retrieve a Vardok id by short name. Args: short_name (str): The short name of the desired Variable Definition Raises: TypeError: If the incorrect type is returned. """ variable_definition = cls.get_variable_definition_by_shortname(short_name) raw_response = DataMigrationApi( VardefClient.get_client() ).get_vardok_vardef_mapping_by_id( variable_definition.id, ) if isinstance(raw_response.actual_instance, VardokIdResponse): return VardokId.from_model(raw_response.actual_instance) msg = "Unexpected response type" raise TypeError(msg)
[docs] @classmethod @vardef_exception_handler def list_variable_definitions( cls, date_of_validity: date | None = None, ) -> list[VariableDefinition]: """List variable definitions. --------- Filtering --------- If no filter arguments are provided then all Variable Definitions are returned. See the documentation for the individual arguments to understand their effect. Filter arguments are combined with AND logic. Args: date_of_validity (date | None, optional): List only variable definitions which are valid on this date. Defaults to None. Returns: list[VariableDefinition]: The list of Variable Definitions. """ return [ VariableDefinition.from_model(definition) for definition in VariableDefinitionsApi( VardefClient.get_client(), ).list_variable_definitions( date_of_validity=date_of_validity, ) ]
[docs] @classmethod @vardef_exception_handler def get_variable_definition_by_id( cls, variable_definition_id: str, date_of_validity: date | None = None, ) -> VariableDefinition: """Get a Variable Definition by ID. Args: variable_definition_id (str): The ID of the desired Variable Definition date_of_validity (date | None, optional): List only variable definitions which are valid on this date. Defaults to None. Returns: VariableDefinition: The Variable Definition. Raises: NotFoundException when the given ID is not found """ return VariableDefinition.from_model( VariableDefinitionsApi( VardefClient.get_client(), ).get_variable_definition_by_id( variable_definition_id=variable_definition_id, date_of_validity=date_of_validity, ), )
[docs] @classmethod @vardef_exception_handler def get_variable_definition_by_shortname( cls, short_name: str, date_of_validity: date | None = None, ) -> VariableDefinition: """Retrieve a Variable Definition by short name. Args: short_name (str): The short name of the Variable Definition. date_of_validity (date | None, optional): Filter by validity date. Defaults to None. Returns: VariableDefinition: The retrieved Variable Definition. Raises: VariableNotFoundError: If no matching Variable Definition is found. ValueError: If multiple variables with the same shortname is found. """ client = VardefClient.get_client() api = VariableDefinitionsApi(client) variable_definitions = api.list_variable_definitions( short_name=short_name, date_of_validity=date_of_validity, ) if not variable_definitions: msg = f"Variable with short name {short_name} not found" raise VariableNotFoundError(msg) if len(variable_definitions) > 1: msg = f"Lookup by short name {short_name} found multiple variables which should not be possible." raise VariableNotFoundError(msg) return VariableDefinition.from_model(variable_definitions[0])
[docs] @classmethod @vardef_file_error_handler def write_template_to_file(cls, custom_file_path: str | None = None) -> Path: """Write template with default values to a yaml file.""" file_path = create_template_yaml( custom_directory=Path(custom_file_path) if custom_file_path else None, ) logger.info( f"✅ Created editable variable definition template file at {file_path}", # noqa: G004 ) return file_path
[docs] @classmethod @vardef_exception_handler def does_short_name_exist( cls, short_name: str, ) -> bool: """Return True if the short name exists in Vardef, otherwise False.""" variable_definitions = Vardef.list_variable_definitions() for variable in variable_definitions: if short_name.strip() == variable.short_name: logger.info( f"Found duplicate short name {short_name}", # noqa: G004 ) return True return False