Source code for esrf_ontologies.technique.types
import dataclasses
import logging
from typing import Dict
from typing import List
from typing import MutableMapping
from typing import Optional
from typing import Set
from typing import Tuple
from typing import Union
_logger = logging.getLogger(__name__)
[docs]
@dataclasses.dataclass(frozen=True)
class Technique:
    """Technique defined in an Ontology.

    The dataclass is frozen: attributes cannot be reassigned after creation.
    """

    iri: str  # Internationalized Resource Identifier
    names: Tuple[str, ...]  # Human readable names (first is the preferred one)
    description: str  # Human readable description
    ontology_version: str  # Ontology version extracted from OWL

    @property
    def primary_name(self) -> str:
        """Return the preferred human readable name (first item of ``names``)."""
        return self.names[0]

    @property
    def versioned_iri(self) -> str:
        """Return versioned IRI derived from stable IRI and ontology version.

        The ontology version is inserted between the part before the first
        ``#`` and the fragment after it, e.g. ``http://host/onto#XAS`` with
        version ``v1`` becomes ``http://host/onto/v1/#XAS``.

        :raises ValueError: when the IRI does not contain a ``#`` fragment.
        """
        base, separator, fragment = self.iri.partition("#")
        if not separator:
            # Same exception type as a failed tuple unpacking, but with a
            # message that tells which IRI is malformed.
            raise ValueError(
                f"Cannot derive a versioned IRI from '{self.iri}': missing '#' fragment"
            )
        return f"{base}/{self.ontology_version}/#{fragment}"
# Key under which the technique entries are stored in the BLISS scan info;
# the same value is listed under "scan_meta_categories".
# NOTE(review): the value is an empty string here - confirm this is intended.
BLISS_SCANINFO_CATEGORY = ""
# Prefix of the keys holding technique IRIs; a 1-based index is appended.
_NEXUS_IDENTIFIER_PREFIX = "identifier_technique_"
[docs]
@dataclasses.dataclass
class TechniqueMetadata:
    """Set of techniques with associated metadata for file (BLISS scan info)
    and data portal (ICAT dataset metadata)."""

    techniques: Set[Technique]

    def get_scan_metadata(
        self,
    ) -> Optional[Dict[str, Union[List[str], Dict[str, str]]]]:
        """Return the technique identifier entries, or ``None`` without techniques."""
        if not self.techniques:
            return None
        return self._get_nxentry_children()

    def get_scan_info(self) -> Dict[str, Union[List[str], Dict[str, str]]]:
        """Return a new scan info mapping describing the techniques.

        The result is empty when there are no techniques. Otherwise it holds
        the identifier entries under ``BLISS_SCANINFO_CATEGORY`` and lists
        that category under ``"scan_meta_categories"``.
        """
        if not self.techniques:
            return dict()
        return {
            BLISS_SCANINFO_CATEGORY: self._get_nxentry_children(),
            "scan_meta_categories": [BLISS_SCANINFO_CATEGORY],
        }

    def fill_scan_info(self, scan_info: MutableMapping) -> None:
        """Add the techniques to an existing scan info mapping (in place).

        Existing entries are preserved; techniques that are already present
        are not added a second time. Nothing happens without techniques.
        """
        if not self.techniques:
            return
        scan_meta_categories = scan_info.setdefault("scan_meta_categories", list())
        if BLISS_SCANINFO_CATEGORY not in scan_meta_categories:
            scan_meta_categories.append(BLISS_SCANINFO_CATEGORY)
        nxentry_children = scan_info.get(BLISS_SCANINFO_CATEGORY)
        if nxentry_children is None:
            nxentry_children = scan_info[BLISS_SCANINFO_CATEGORY] = dict()
        self._fill_nxentry_children(nxentry_children)

    def _get_nxentry_children(self) -> Dict[str, str]:
        """Return ``identifier_technique_<i>`` entries (1-based) for all techniques.

        Each identifier maps to the versioned IRI and is accompanied by an
        ``<identifier>@type`` entry with value ``"W3ID"``.
        """
        nxentry_children = dict()
        for i, technique in enumerate(self._get_sorted_techniques(), 1):
            key = f"{_NEXUS_IDENTIFIER_PREFIX}{i}"
            nxentry_children[key] = technique.versioned_iri
            nxentry_children[f"{key}@type"] = "W3ID"
        return nxentry_children

    def _fill_nxentry_children(self, nxentry_children: MutableMapping) -> None:
        """Append the techniques that are missing from ``nxentry_children``.

        New identifiers are numbered after the highest index already in use.
        """
        existing = {
            key: value
            for key, value in nxentry_children.items()
            if key.startswith(_NEXUS_IDENTIFIER_PREFIX) and not key.endswith("@type")
        }
        existing_iris = set(existing.values())

        used_indices = set()
        for key in existing:
            try:
                used_indices.add(int(key.split("_")[-1]))
            except ValueError:
                # Foreign key sharing the prefix (e.g. another attribute):
                # it does not occupy an index.
                continue
        next_index = max(used_indices, default=0) + 1

        for technique in self._get_sorted_techniques():
            versioned_iri = technique.versioned_iri
            # Stored values are versioned IRIs, so that is what must be
            # compared; the stable IRI is accepted as well in case the
            # mapping was filled with unversioned identifiers.
            if versioned_iri in existing_iris or technique.iri in existing_iris:
                continue
            key = f"{_NEXUS_IDENTIFIER_PREFIX}{next_index}"
            nxentry_children[key] = versioned_iri
            nxentry_children[f"{key}@type"] = "W3ID"
            next_index += 1

    def _get_sorted_techniques(self) -> List[Technique]:
        """Return the techniques ordered by primary name.

        The IRI breaks ties so that the order (and hence the identifier
        numbering) does not depend on set iteration order.
        """
        return sorted(
            self.techniques,
            key=lambda technique: (technique.primary_name, technique.iri),
        )

    @staticmethod
    def _split_field(dataset: MutableMapping, key: str) -> List[str]:
        """Return the non-empty space-separated items of ``dataset[key]``.

        A missing key yields an empty list. Only ``__getitem__`` is used.
        """
        try:
            value = dataset[key]
        except KeyError:
            return list()
        # Dropping empty items keeps PIDs and definitions aligned when the
        # field is empty or contains consecutive spaces.
        return [item for item in value.split(" ") if item]

    def fill_dataset_metadata(self, dataset: MutableMapping) -> None:
        """Merge the techniques into the ICAT metadata of ``dataset`` (in place).

        Existing ``technique_pid``/``definition`` pairs are kept and extended
        with the techniques of this instance. Nothing happens without
        techniques.

        :raises KeyError: when ``dataset`` refuses a field other than
            ``technique_pid`` or ``technique_pid_esrfet_version``.
        """
        if not self.techniques:
            return

        # Currently handles mutable mappings by only using __getitem__ and __setitem__
        # https://gitlab.esrf.fr/bliss/bliss/-/blob/master/bliss/icat/policy.py
        definitions = self._split_field(dataset, "definition")
        pids = self._split_field(dataset, "technique_pid")
        techniques = dict(zip(pids, definitions))
        for technique in self.techniques:
            techniques[technique.iri] = technique.primary_name

        # The ontology version field is already part of this metadata.
        metadata = self._get_icat_metadata(techniques)
        for key, value in metadata.items():
            try:
                dataset[key] = value
            except KeyError:
                if key in ("technique_pid", "technique_pid_esrfet_version"):
                    _logger.warning(
                        "Skip ICAT field '%s' (requires pyicat-plus>=0.2)", key
                    )
                    continue
                raise

    def _get_ontology_version_number(self) -> str:
        """Return the ontology version of one technique without leading ``v``.

        NOTE(review): the technique is picked arbitrarily; presumably all
        techniques share the same ontology version - confirm.
        """
        return next(iter(self.techniques)).ontology_version.lstrip("v")

    def get_dataset_metadata(self) -> Dict[str, str]:
        """Return the ICAT dataset metadata (empty without techniques)."""
        if not self.techniques:
            return dict()
        techniques = {
            technique.iri: technique.primary_name for technique in self.techniques
        }
        return self._get_icat_metadata(techniques)

    def _get_icat_metadata(self, techniques: Dict[str, str]) -> Dict[str, str]:
        """Build ICAT fields from a mapping of IRI to technique name.

        IRIs and names are ordered by name and joined with single spaces.
        The ontology version field is added when this instance has
        techniques.
        """
        ordered = sorted(techniques.items(), key=lambda item: item[1])
        metadata = {
            "technique_pid": " ".join(iri for iri, _ in ordered),
            "definition": " ".join(name for _, name in ordered),
        }
        if self.techniques:
            metadata["technique_pid_esrfet_version"] = (
                self._get_ontology_version_number()
            )
        return metadata