Source code for esrf_ontologies.technique.types
import dataclasses
import logging
from typing import Dict
from typing import List
from typing import MutableMapping
from typing import Optional
from typing import Set
from typing import Tuple
from typing import Union
_logger = logging.getLogger(__name__)
[docs]
@dataclasses.dataclass(frozen=True)
class Technique:
"""Technique defined in an Ontology"""
iri: str # Internationalized Resource Identifier
names: Tuple[str] # Human readable name (first is the perferred one)
description: str # Human readable description
ontology_version: str # Ontology version extracted from OWL
versioned_iri: str # Versioned IRI derived from stable IRI and ontology version
@property
def primary_name(self) -> str:
return self.names[0]
BLISS_SCANINFO_CATEGORY = ""
_NEXUS_IDENTIFIER_PREFIX = "identifier_technique_"
[docs]
@dataclasses.dataclass
class TechniqueMetadata:
"""Set of techniques with associated metadata for file (BLISS scan info)
and data portal (ICAT dataset metafata)."""
techniques: Set[Technique]
[docs]
def get_scan_metadata(
self,
) -> Optional[Dict[str, Union[List[str], Dict[str, str]]]]:
if self.techniques:
return self._get_nxentry_children()
return None
[docs]
def get_scan_info(self) -> Dict[str, Union[List[str], Dict[str, str]]]:
if not self.techniques:
return dict()
return {
BLISS_SCANINFO_CATEGORY: self._get_nxentry_children(),
"scan_meta_categories": [BLISS_SCANINFO_CATEGORY],
}
[docs]
def fill_scan_info(self, scan_info: MutableMapping) -> None:
if not self.techniques:
return
scan_meta_categories = scan_info.setdefault("scan_meta_categories", list())
if BLISS_SCANINFO_CATEGORY not in scan_meta_categories:
scan_meta_categories.append(BLISS_SCANINFO_CATEGORY)
nxentry_children = scan_info.get(BLISS_SCANINFO_CATEGORY)
if nxentry_children is None:
nxentry_children = scan_info[BLISS_SCANINFO_CATEGORY] = dict()
self._fill_nxentry_children(nxentry_children)
def _get_nxentry_children(self) -> Dict[str, str]:
nxentry_children = dict()
sorted_techniques = self._get_sorted_techniques()
for i, technique in enumerate(sorted_techniques, 1):
key = f"{_NEXUS_IDENTIFIER_PREFIX}{i}"
nxentry_children[key] = technique.versioned_iri
nxentry_children[f"{key}@type"] = "W3ID"
return nxentry_children
def _fill_nxentry_children(self, nxentry_children: MutableMapping) -> None:
sorted_techniques = self._get_sorted_techniques()
existing = {
key: value
for key, value in nxentry_children.items()
if key.startswith(_NEXUS_IDENTIFIER_PREFIX) and not key.endswith("@type")
}
existing_iris = set(existing.values())
used_indices = {int(key.split("_")[-1]) for key in existing}
next_index = max(used_indices, default=0) + 1
for technique in sorted_techniques:
if technique.iri in existing_iris:
continue
key = f"{_NEXUS_IDENTIFIER_PREFIX}{next_index}"
nxentry_children[key] = technique.versioned_iri
nxentry_children[f"{key}@type"] = "W3ID"
next_index += 1
def _get_sorted_techniques(self) -> List[Technique]:
return sorted(self.techniques, key=lambda technique: technique.primary_name)
[docs]
def fill_dataset_metadata(self, dataset: MutableMapping) -> None:
if not self.techniques:
return
# The 'dataset' object from Bliss handles mutable mappings by only using
# __getitem__ and __setitem__
# https://gitlab.esrf.fr/bliss/bliss/-/blob/master/bliss/icat/policy.py
# Get existing dataset technique names and pid's
try:
definitions = dataset["definition"].split(" ")
except KeyError:
definitions = list()
try:
pids = dataset["technique_pid"].split(" ")
except KeyError:
pids = list()
# Add technique names and pid's
techniques = dict(zip(pids, definitions))
for technique in self.techniques:
techniques[technique.iri] = technique.primary_name
# Replace ICAT metadata associated to 'techniques'
metadata = self._get_icat_metadata(techniques)
for key, value in metadata.items():
try:
dataset[key] = value
except KeyError:
if key in ("technique_pid", "technique_pid_esrfet_version"):
_logger.warning(
f"Skip ICAT field '{key}' (requires pyicat-plus>=0.2)"
)
continue
raise
[docs]
def get_dataset_metadata(self) -> Dict[str, str]:
if not self.techniques:
return dict()
techniques = {
technique.iri: technique.primary_name for technique in self.techniques
}
return self._get_icat_metadata(techniques)
def _get_icat_metadata(self, techniques: Dict[str, str]) -> Dict[str, str]:
if not techniques:
return dict()
iris, definitions = zip(*sorted(techniques.items(), key=lambda tpl: tpl[1]))
metadata = {
"technique_pid": " ".join(iris),
"definition": " ".join(definitions),
}
if self.techniques:
metadata["technique_pid_esrfet_version"] = (
self._get_ontology_version_number()
)
return metadata
def _get_ontology_version_number(self) -> Optional[str]:
if self.techniques:
return next(iter(self.techniques)).ontology_version.lstrip("v")
return None