# nwb-linkml/nwb_linkml/adapters/namespaces.py

"""
Namespaces adapter

Wraps the :class:`nwb_schema_language.Namespaces` and other objects with convenience methods
for extracting information and generating translated schema
"""
import pdb
from typing import List, Optional
from pathlib import Path
from pydantic import BaseModel, Field, validator, PrivateAttr
from pprint import pformat
from linkml_runtime.linkml_model import SchemaDefinition
from linkml_runtime.dumpers import yaml_dumper


from nwb_schema_language import Namespaces

from nwb_linkml.adapters.adapter import Adapter, BuildResult
from nwb_linkml.adapters.schema import SchemaAdapter
from nwb_linkml.lang_elements import NwbLangSchema

class NamespacesAdapter(Adapter):
    """
    Adapter around a :class:`nwb_schema_language.Namespaces` object.

    Attributes are documented inline below. On construction, each schema
    adapter is annotated with the name of the namespace that lists it as a
    source, and the current ``split`` setting is pushed down to the schemas.
    """
    # the parsed namespaces document
    namespaces: Namespaces
    # adapters for the schema files belonging to these namespaces
    schemas: List[SchemaAdapter]
    # other namespace adapters that are searched when resolving needed types
    imported: List['NamespacesAdapter'] = Field(default_factory=list)

    # set to True once populate_imports() has run, so build() only does it once
    _imports_populated: bool = PrivateAttr(False)
    # backing value for the ``split`` property
    _split: bool = PrivateAttr(False)

    def __init__(self, **kwargs):
        super(NamespacesAdapter, self).__init__(**kwargs)
        self._populate_schema_namespaces()
        # go through the property setter so that the default is propagated
        # to every contained schema adapter
        self.split = self._split

    def build(self) -> BuildResult:
        """
        Build every contained schema, recursively build imported namespaces,
        and generate one top-level schema per namespace.

        Returns:
            BuildResult: accumulated results of all schema builds, plus
            ``NwbLangSchema`` and one :class:`SchemaDefinition` per namespace
            that imports that namespace's schemas and all imported namespaces.
        """
        if not self._imports_populated:
            self.populate_imports()

        sch_result = BuildResult()
        for sch in self.schemas:
            sch_result += sch.build()
        # recursive step
        for imported in self.imported:
            sch_result += imported.build()

        # add in monkeypatch nwb types
        sch_result.schemas.append(NwbLangSchema)

        # names of every namespace provided by the imported adapters; these are
        # the same for each namespace generated below, so compute them once
        imported_ns_names = [
            imported_ns.name
            for imported in self.imported
            for imported_ns in imported.namespaces.namespaces
        ]

        # now generate the top-level namespaces that import everything
        for ns in self.namespaces.namespaces:
            ns_schemas = [sch.name for sch in self.schemas if sch.namespace == ns.name]
            # also add imports bc, well, we need them
            ns_schemas.extend(imported_ns_names)
            ns_schema = SchemaDefinition(
                name=ns.name,
                id=ns.name,
                description=ns.doc,
                version=ns.version,
                imports=ns_schemas,
                annotations=[{'tag': 'namespace', 'value': True}]
            )
            sch_result.schemas.append(ns_schema)

        return sch_result

    @property
    def split(self) -> bool:
        """
        Whether the generated schema are set to be split.

        Assigning to this property sets the :attr:`.SchemaAdapter.split`
        attribute on all contained schemas and on the schemas of each directly
        imported namespace adapter.

        Returns:
            bool: whether the schema are set to be split!
        """
        return self._split

    @split.setter
    def split(self, split):
        for sch in self.schemas:
            sch.split = split
        # only the schemas of directly imported adapters are updated here;
        # the imported adapters' own ``_split`` value is left untouched
        for ns in self.imported:
            for sch in ns.schemas:
                sch.split = split

        self._split = split

    def _populate_schema_namespaces(self):
        """
        Annotate each schema adapter with the name of the namespace that
        lists its file as a source.

        A schema that is not listed by any namespace is left unchanged.
        """
        for sch in self.schemas:
            # imports seem to always be from same folder, so we can just use name part
            sch_name = sch.path.name
            # find which namespace imports this schema file
            for ns in self.namespaces.namespaces:
                sources = [ns_sch.source for ns_sch in ns.schema_]
                # sources may be given with or without the file extension
                if sch_name in sources or sch.path.stem in sources:
                    sch.namespace = ns.name
                    break

    def find_type_source(self, name: str) -> SchemaAdapter:
        """
        Given some neurodata_type_inc, find the schema that it's defined in.

        The schemas of this adapter are checked first; the schemas of imported
        adapters are only searched when there is no internal match. Within
        each group all schemas are checked rather than returning on the first
        match, so that ambiguous definitions are detected.

        Args:
            name (str): the ``neurodata_type_def`` to look for

        Returns:
            SchemaAdapter: the single schema adapter that defines ``name``

        Raises:
            KeyError: if more than one schema in the same group defines
                ``name``, or if no schema defines it
        """
        # First check within the main schema
        internal_matches = [
            schema for schema in self.schemas
            if name in [cls.neurodata_type_def for cls in schema.created_classes]
        ]

        if len(internal_matches) > 1:
            # imported schemas have not been searched at this point, so only
            # the internal matches can be reported
            raise KeyError(
                f"Found multiple schemas in namespace that define {name}:\ninternal: {pformat(internal_matches)}")
        elif len(internal_matches) == 1:
            return internal_matches[0]

        import_matches = [
            schema
            for imported_ns in self.imported
            for schema in imported_ns.schemas
            if name in [cls.neurodata_type_def for cls in schema.created_classes]
        ]

        if len(import_matches) > 1:
            raise KeyError(f"Found multiple schemas in namespace that define {name}:\ninternal: {pformat(internal_matches)}\nimported:{pformat(import_matches)}")
        elif len(import_matches) == 1:
            return import_matches[0]
        else:
            raise KeyError(f"No schema found that define {name}")

    def populate_imports(self):
        """
        Populate the imports that are needed for each schema file

        For every type listed in a schema's ``needed_imports``, the defining
        schema is looked up with :meth:`find_type_source` and appended to that
        schema's ``imports`` if not already present. The same is then done for
        each imported namespace adapter.

        Raises:
            KeyError: propagated from :meth:`find_type_source` when a needed
                type cannot be resolved unambiguously
        """
        for sch in self.schemas:
            for needs in sch.needed_imports:
                # shouldn't be recursive references, since imports should form a tree
                depends_on = self.find_type_source(needs)
                if depends_on not in sch.imports:
                    sch.imports.append(depends_on)

        # do so recursively
        for imported in self.imported:
            imported.populate_imports()

        self._imports_populated = True

    def to_yaml(self, base_dir: Path):
        """
        Build all schemas and write each one to ``<base_dir>/<schema name>.yaml``.

        Args:
            base_dir (Path): output directory; created if it does not exist
                (its parent directory must already exist)
        """
        schemas = self.build().schemas
        base_dir = Path(base_dir)

        base_dir.mkdir(exist_ok=True)

        for schema in schemas:
            output_file = base_dir / (schema.name + '.yaml')
            yaml_dumper.dump(schema, output_file)
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`"""`
			`Namespaces adapter`

			Wraps the :class:`nwb_schema_language.Namespaces` and other objects with convenience methods
			`for extracting information and generating translated schema`
			`"""`
			`import pdb`
			`from typing import List, Optional`
- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`from pathlib import Path`
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`from pydantic import BaseModel, Field, validator, PrivateAttr`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`from pprint import pformat`
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`from linkml_runtime.linkml_model import SchemaDefinition`
- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`from linkml_runtime.dumpers import yaml_dumper`

Actually generating some translations at this point 2023-08-22 04:43:02 +00:00
			`from nwb_schema_language import Namespaces`

recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`from nwb_linkml.adapters.adapter import Adapter, BuildResult`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`from nwb_linkml.adapters.schema import SchemaAdapter`
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`from nwb_linkml.lang_elements import NwbLangSchema`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00
			`class NamespacesAdapter(Adapter):`
			`namespaces: Namespaces`
			`schemas: List[SchemaAdapter]`
			`imported: List['NamespacesAdapter'] = Field(default_factory=list)`

- Don't split schema into includes and base - Import top-level classes in namespaces pydantic file - Don't generate or import the arraylike class 2023-09-04 21:56:36 +00:00			`_imports_populated: bool = PrivateAttr(False)`
			`_split: bool = PrivateAttr(False)`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00
			`def __init__(self, **kwargs):`
			`super(NamespacesAdapter, self).__init__(**kwargs)`
			`self._populate_schema_namespaces()`
- Don't split schema into includes and base - Import top-level classes in namespaces pydantic file - Don't generate or import the arraylike class 2023-09-04 21:56:36 +00:00			`self.split = self._split`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`def build(self) -> BuildResult:`
			`if not self._imports_populated:`
			`self.populate_imports()`


			`sch_result = BuildResult()`
			`for sch in self.schemas:`
			`sch_result += sch.build()`
			`# recursive step`
			`for imported in self.imported:`
			`imported_build = imported.build()`
			`sch_result += imported_build`

			`# add in monkeypatch nwb types`
			`sch_result.schemas.append(NwbLangSchema)`

			`# now generate the top-level namespaces that import everything`
			`for ns in self.namespaces.namespaces:`
- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`ns_schemas = [sch.name for sch in self.schemas if sch.namespace == ns.name]`
			`# also add imports bc, well, we need them`
			`ns_schemas.extend([ns.name for imported in self.imported for ns in imported.namespaces.namespaces])`
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`ns_schema = SchemaDefinition(`
			`name = ns.name,`
			`id = ns.name,`
			`description = ns.doc,`
			`version = ns.version,`
- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`imports=ns_schemas,`
- Don't split schema into includes and base - Import top-level classes in namespaces pydantic file - Don't generate or import the arraylike class 2023-09-04 21:56:36 +00:00			`annotations=[{'tag': 'namespace', 'value': True}]`
recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`)`
			`sch_result.schemas.append(ns_schema)`

			`return sch_result`

- Don't split schema into includes and base - Import top-level classes in namespaces pydantic file - Don't generate or import the arraylike class 2023-09-04 21:56:36 +00:00			`@property`
			`def split(self) -> bool:`
			`"""`
			Sets the :attr:`.SchemaAdapter.split` attribute for all contained and imported schema

			`Args:`
			`split (bool): Set the generated schema to be split or not`

			`Returns:`
			`bool: whether the schema are set to be split!`
			`"""`
			`return self._split`

			`@split.setter`
			`def split(self, split):`
			`for sch in self.schemas:`
			`sch.split = split`
			`for ns in self.imported:`
			`for sch in ns.schemas:`
			`sch.split = split`

			`self._split = split`

Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`def _populate_schema_namespaces(self):`
			`# annotate for each schema which namespace imports it`
			`for sch in self.schemas:`
			`# imports seem to always be from same folder, so we can just use name part`
			`sch_name = sch.path.name`
			`# find which namespace imports this schema file`
			`for ns in self.namespaces.namespaces:`
			`sources = [sch.source for sch in ns.schema_]`
- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`if sch_name in sources or sch.path.stem in sources:`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`sch.namespace = ns.name`
			`break`



			`def find_type_source(self, name:str) -> SchemaAdapter:`
			`"""`
			`Given some neurodata_type_inc, find the schema that it's defined in.`
Working recursion! and also handling multiple array shapes, and properly handling unnamed classes 2023-09-01 03:56:21 +00:00
			`Rather than returning as soon as a match is found, check all`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`"""`
			`# First check within the main schema`
			`internal_matches = []`
			`for schema in self.schemas:`
			`class_names = [cls.neurodata_type_def for cls in schema.created_classes]`
			`if name in class_names:`
			`internal_matches.append(schema)`

Working recursion! and also handling multiple array shapes, and properly handling unnamed classes 2023-09-01 03:56:21 +00:00			`if len(internal_matches) > 1:`
			`raise KeyError(`
			`f"Found multiple schemas in namespace that define {name}:\ninternal: {pformat(internal_matches)}\nimported:{pformat(import_matches)}")`
			`elif len(internal_matches) == 1:`
			`return internal_matches[0]`

Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`import_matches = []`
			`for imported_ns in self.imported:`
			`for schema in imported_ns.schemas:`
			`class_names = [cls.neurodata_type_def for cls in schema.created_classes]`
			`if name in class_names:`
			`import_matches.append(schema)`

Working recursion! and also handling multiple array shapes, and properly handling unnamed classes 2023-09-01 03:56:21 +00:00			`if len(import_matches)>1:`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`raise KeyError(f"Found multiple schemas in namespace that define {name}:\ninternal: {pformat(internal_matches)}\nimported:{pformat(import_matches)}")`
Working recursion! and also handling multiple array shapes, and properly handling unnamed classes 2023-09-01 03:56:21 +00:00			`elif len(import_matches) == 1:`
			`return import_matches[0]`
Actually generating some translations at this point 2023-08-22 04:43:02 +00:00			`else:`
			`raise KeyError(f"No schema found that define {name}")`

			`def populate_imports(self):`
			`"""`
			`Populate the imports that are needed for each schema file`

			`"""`
			`for sch in self.schemas:`
			`for needs in sch.needed_imports:`
			`# shouldn't be recursive references, since imports should form a tree`
			`depends_on = self.find_type_source(needs)`
			`if depends_on not in sch.imports:`
			`sch.imports.append(depends_on)`

recursion works, more formal build method in adapters 2023-08-24 02:56:09 +00:00			`# do so recursively`
			`for imported in self.imported:`
			`imported.populate_imports()`

			`self._imports_populated = True`

- Able to complete build all the way through to importing generated classes 2023-09-05 04:46:17 +00:00			`def to_yaml(self, base_dir:Path):`
			`schemas = self.build().schemas`
			`base_dir = Path(base_dir)`

			`base_dir.mkdir(exist_ok=True)`

			`for schema in schemas:`
			`output_file = base_dir / (schema.name + '.yaml')`
			`yaml_dumper.dump(schema, output_file)`

Actually generating some translations at this point 2023-08-22 04:43:02 +00:00