From 71b2d1845b66374670a2965c4cac15b9ad130dc0 Mon Sep 17 00:00:00 2001
From: wpbonelli <wpbonelli@gmail.com>
Date: Thu, 7 Aug 2025 17:31:43 -0400
Subject: [PATCH 01/13] feat(dfn): distinguish file format from schema version

---
 autotest/test_dfn.py                 |   5 +-
 modflow_devtools/dfn.py              | 794 ---------------------------
 modflow_devtools/dfn/__init__.py     | 459 ++++++++++++++++
 modflow_devtools/dfn/fetch.py        |  29 +
 modflow_devtools/dfn/parse.py        | 182 ++++++
 modflow_devtools/dfn/schema/block.py |  22 +
 modflow_devtools/dfn/schema/field.py |  39 ++
 modflow_devtools/dfn/schema/ref.py   |  13 +
 modflow_devtools/dfn/schema/v1.py    |  22 +
 modflow_devtools/dfn/schema/v2.py    |  18 +
 modflow_devtools/dfn2toml.py         |  76 +--
 11 files changed, 809 insertions(+), 850 deletions(-)
 delete mode 100644 modflow_devtools/dfn.py
 create mode 100644 modflow_devtools/dfn/__init__.py
 create mode 100644 modflow_devtools/dfn/fetch.py
 create mode 100644 modflow_devtools/dfn/parse.py
 create mode 100644 modflow_devtools/dfn/schema/block.py
 create mode 100644 modflow_devtools/dfn/schema/field.py
 create mode 100644 modflow_devtools/dfn/schema/ref.py
 create mode 100644 modflow_devtools/dfn/schema/v1.py
 create mode 100644 modflow_devtools/dfn/schema/v2.py

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index e5158c8e..a1810968 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -2,7 +2,8 @@
 
 import pytest
 
-from modflow_devtools.dfn import Dfn, get_dfns
+from modflow_devtools.dfn import Dfn
+from modflow_devtools.dfn.fetch import fetch_dfns
 from modflow_devtools.dfn2toml import convert
 from modflow_devtools.markers import requires_pkg
 
@@ -18,7 +19,7 @@
 def pytest_generate_tests(metafunc):
     if "dfn_name" in metafunc.fixturenames:
         if not any(DFN_DIR.glob("*.dfn")):
-            get_dfns(MF6_OWNER, MF6_REPO, MF6_REF, DFN_DIR, verbose=True)
+            fetch_dfns(MF6_OWNER, MF6_REPO, MF6_REF, DFN_DIR, verbose=True)
         dfn_names = [
             dfn.stem
             for dfn in DFN_DIR.glob("*.dfn")
diff --git a/modflow_devtools/dfn.py b/modflow_devtools/dfn.py
deleted file mode 100644
index 9a543ec0..00000000
--- a/modflow_devtools/dfn.py
+++ /dev/null
@@ -1,794 +0,0 @@
-"""
-MODFLOW 6 definition file tools. Includes types for field
-and component specification, a parser for the original
-DFN format as well as for TOML definition files, and
-a function to fetch DFNs from the MF6 repository.
-"""
-
-import shutil
-import tempfile
-from ast import literal_eval
-from collections.abc import Mapping
-from itertools import groupby
-from os import PathLike
-from pathlib import Path
-from typing import (
-    Any,
-    Literal,
-    Optional,
-    TypedDict,
-)
-from warnings import warn
-
-import tomli
-from boltons.dictutils import OMD
-from boltons.iterutils import remap
-
-from modflow_devtools.download import download_and_unzip
-from modflow_devtools.misc import try_literal_eval
-
-
-def try_parse_bool(value: Any) -> Any:
-    """
-    Try to parse a boolean from a string as represented
-    in a DFN file, otherwise return the value unaltered.
-    """
-    if isinstance(value, str):
-        value = value.lower()
-        if value in ["true", "false"]:
-            return value == "true"
-    return value
-
-
-def field_attr_sort_key(item) -> int:
-    """
-    Sort key for input field attributes. The order is:
-    -1. block
-    0. name
-    1. type
-    2. shape
-    3. default
-    4. reader
-    5. optional
-    6. longname
-    7. description
-    """
-
-    k, _ = item
-    if k == "block":
-        return -1
-    if k == "name":
-        return 0
-    if k == "type":
-        return 1
-    if k == "shape":
-        return 2
-    if k == "default":
-        return 3
-    if k == "reader":
-        return 4
-    if k == "optional":
-        return 5
-    if k == "longname":
-        return 6
-    if k == "description":
-        return 7
-    return 8
-
-
-def block_sort_key(item) -> int:
-    k, _ = item
-    if k == "options":
-        return 0
-    elif k == "dimensions":
-        return 1
-    elif k == "griddata":
-        return 2
-    elif k == "packagedata":
-        return 3
-    elif "period" in k:
-        return 4
-    else:
-        return 5
-
-
-FormatVersion = Literal[1, 2]
-"""DFN format version number."""
-
-
-FieldType = Literal[
-    "keyword",
-    "integer",
-    "double precision",
-    "string",
-    "record",
-    "recarray",
-    "keystring",
-]
-
-
-Reader = Literal[
-    "urword",
-    "u1ddbl",
-    "u2ddbl",
-    "readarray",
-]
-
-
-SCALAR_TYPES = ("keyword", "integer", "double precision", "string")
-_SCALAR_TYPES = SCALAR_TYPES  # allow backwards compat; imported by flopy
-
-
-Dfns = dict[str, "Dfn"]
-Fields = dict[str, "Field"]
-Block = Fields
-Blocks = dict[str, Block]
-
-
-def get_blocks(dfn: "Dfn") -> Blocks:
-    """
-    Extract blocks from an input definition.
-    """
-
-    def _is_block(item: tuple[str, Any]) -> bool:
-        k, _v = item
-        return k not in Dfn.__annotations__
-
-    return dict(
-        sorted(
-            {k: v for k, v in dfn.items() if _is_block((k, v))}.items(),  # type: ignore
-            key=block_sort_key,
-        )
-    )
-
-
-def get_fields(dfn: "Dfn") -> Fields:
-    """
-    Extract a flat dictionary of fields from an input definition.
-    Only top-level fields are included, i.e. subfields of records
-    or recarrays are not included.
-    """
-    fields = {}
-    for block in get_blocks(dfn).values():
-        for field in block.values():
-            if field["name"] in fields:
-                warn(f"Duplicate field name {field['name']} in {dfn['name']}")
-            fields[field["name"]] = field
-    return fields
-
-
-class Field(TypedDict):
-    """A field specification."""
-
-    name: str
-    type: FieldType
-    shape: Any | None
-    block: str | None
-    default: Any | None
-    children: Optional["Fields"]
-    description: str | None
-    reader: Reader
-
-
-class Ref(TypedDict):
-    """
-    A foreign-key-like reference between a file input variable
-    in a referring input component and another input component
-    referenced by it. Previously known as a "subpackage".
-
-    A `Dfn` with a nonempty `ref` can be referred to by other
-    component definitions, via a filepath variable which acts
-    as a foreign key. If such a variable is detected when any
-    component is loaded, the component's `__init__` method is
-    modified, such that the variable named `val`, residing in
-    the referenced component, replaces the variable with name
-    `key` in the referencing component, i.e., the foreign key
-    filepath variable, This forces a referencing component to
-    accept a subcomponent's data directly, as if it were just
-    a variable, rather than indirectly, with the subcomponent
-    loaded up from a file identified by the filepath variable.
-    """
-
-    key: str
-    val: str
-    abbr: str
-    param: str
-    parent: str
-    description: str | None
-
-
-class Sln(TypedDict):
-    """
-    A solution package specification.
-    """
-
-    abbr: str
-    pattern: str
-
-
-class Dfn(TypedDict):
-    """
-    MODFLOW 6 input definition. An input definition
-    specifies a component in an MF6 simulation, e.g.
-    a model or package. A component contains input
-    variables, and may contain other metadata such
-    as foreign key references to other components
-    (i.e. subpackages), package-specific metadata
-    (e.g. for solutions), advanced package status,
-    and whether the component is a multi-package.
-
-    An input definition must have a name. Other top-
-    level keys are blocks, which must be mappings of
-    `str` to `Field`, and metadata, of which only a
-    limited set of keys are allowed. Block names and
-    metadata keys may not overlap.
-    """
-
-    name: str
-    advanced: bool
-    multi: bool
-    parent: str | None
-    ref: Ref | None
-    sln: Sln | None
-
-    @staticmethod  # type: ignore[misc]
-    def _load_v1_flat(f, common: dict | None = None) -> tuple[Mapping, list[str]]:
-        field = {}
-        flat = []
-        meta = []
-        common = common or {}
-
-        for line in f:
-            # remove whitespace/etc from the line
-            line = line.strip()
-
-            # record context name and flopy metadata
-            # attributes, skip all other comment lines
-            if line.startswith("#"):
-                _, sep, tail = line.partition("flopy")
-                if sep == "flopy":
-                    if (
-                        "multi-package" in tail
-                        or "solution_package" in tail
-                        or "subpackage" in tail
-                        or "parent" in tail
-                    ):
-                        meta.append(tail.strip())
-                _, sep, tail = line.partition("package-type")
-                if sep == "package-type":
-                    meta.append(f"package-type {tail.strip()}")
-                continue
-
-            # if we hit a newline and the parameter dict
-            # is nonempty, we've reached the end of its
-            # block of attributes
-            if not any(line):
-                if any(field):
-                    flat.append((field["name"], field))
-                    field = {}
-                continue
-
-            # split the attribute's key and value and
-            # store it in the parameter dictionary
-            key, _, value = line.partition(" ")
-            if key == "default_value":
-                key = "default"
-            field[key] = value
-
-            # make substitutions from common variable definitions,
-            # remove backslashes, TODO: generate/insert citations.
-            descr = field.get("description", None)
-            if descr:
-                descr = descr.replace("\\", "").replace("``", "'").replace("''", "'")
-                _, replace, tail = descr.strip().partition("REPLACE")
-                if replace:
-                    key, _, subs = tail.strip().partition(" ")
-                    subs = literal_eval(subs)
-                    cmmn = common.get(key, None)
-                    if cmmn is None:
-                        warn(
-                            "Can't substitute description text, "
-                            f"common variable not found: {key}"
-                        )
-                    else:
-                        descr = cmmn.get("description", "")
-                        if any(subs):
-                            descr = descr.replace("\\", "").replace(
-                                "{#1}", subs["{#1}"]
-                            )
-                field["description"] = descr
-
-        # add the final parameter
-        if any(field):
-            flat.append((field["name"], field))
-
-        # the point of the OMD is to losslessly handle duplicate variable names
-        return OMD(flat), meta
-
-    @classmethod  # type: ignore[misc]
-    def _load_v1(cls, f, name, **kwargs) -> "Dfn":
-        """
-        Temporary load routine for the v1 DFN format.
-        """
-
-        flat, meta = Dfn._load_v1_flat(f, **kwargs)
-
-        def _convert_recarray_block(block: Block, block_name: str) -> Block:
-            """
-            Convert a recarray block to individual arrays, one per column.
-
-            Extract recarray fields and create separate array variables. For period
-            blocks, give each an appropriate grid- or time-aligned shape (nper, nnodes).
-            For other blocks, uses the declared dimensions directly.
-            """
-
-            fields = list(block.values())
-            if fields[0]["type"] == "recarray":
-                assert len(fields) == 1
-                recarray_field = fields[0]
-                recarray_name = recarray_field["name"]
-                item = next(iter(recarray_field["children"].values()))
-                columns = item["children"]
-
-                # Get the original recarray shape to determine base dimensions
-                recarray_shape = recarray_field.get("shape")
-                if recarray_shape:
-                    # Parse shape like "(nexg)" or "(maxbound)"
-                    base_dims = recarray_shape[1:-1].split(",")
-                    base_dims = [dim.strip() for dim in base_dims if dim.strip()]
-                else:
-                    base_dims = []
-            else:
-                recarray_name = None
-                columns = block
-                base_dims = []
-
-            # Remove the original recarray field
-            block.pop(recarray_name, None)
-
-            # Handle cellid specially - it indicates spatial indexing
-            cellid = columns.pop("cellid", None)
-
-            for col_name, column in columns.items():
-                col_copy = column.copy()
-                old_dims = col_copy.get("shape")
-                if old_dims:
-                    old_dims = old_dims[1:-1].split(",")
-                    old_dims = [dim.strip() for dim in old_dims if dim.strip()]
-                else:
-                    old_dims = []
-
-                # Determine new dimensions based on block type
-                if block_name == "period":
-                    # Period blocks get time + spatial dimensions
-                    new_dims = ["nper"]
-                    if cellid:
-                        new_dims.append("nnodes")
-                    # Add any additional dimensions, excluding maxbound
-                    if old_dims:
-                        new_dims.extend([dim for dim in old_dims if dim != "maxbound"])
-                else:
-                    # Non-period blocks use declared dimensions
-                    new_dims = []
-                    if base_dims:
-                        # Use the dimensions from the recarray shape
-                        # Only drop maxbound if there are other meaningful dimensions
-                        filtered_base_dims = [
-                            dim for dim in base_dims if dim != "maxbound"
-                        ]
-                        if filtered_base_dims:
-                            new_dims.extend(filtered_base_dims)
-                        else:
-                            # Keep maxbound if no other dimensions are available
-                            new_dims.extend(base_dims)
-                    # Add any column-specific dimensions
-                    if old_dims:
-                        filtered_old_dims = [
-                            dim for dim in old_dims if dim != "maxbound"
-                        ]
-                        if filtered_old_dims:
-                            new_dims.extend(filtered_old_dims)
-                        else:
-                            # Keep maxbound if no other dimensions are available
-                            new_dims.extend(old_dims)
-
-                if new_dims:
-                    col_copy["shape"] = f"({', '.join(new_dims)})"
-                else:
-                    # Scalar field
-                    col_copy["shape"] = None
-
-                block[col_name] = col_copy
-
-            return block
-
-        def _convert_field(var: dict[str, Any]) -> Field:
-            """
-            Convert an input field specification from its representation
-            in a v1 format definition file to the v2 (structured) format.
-
-            Notes
-            -----
-            If the field does not have a `default` attribute, it will
-            default to `False` if it is a keyword, otherwise to `None`.
-
-            A filepath field whose name functions as a foreign key
-            for a separate context will be given a reference to it.
-            """
-
-            def _load(field) -> Field:
-                field = field.copy()
-
-                # parse booleans from strings. everything else can
-                # stay a string except default values, which we'll
-                # try to parse as arbitrary literals below, and at
-                # some point types, once we introduce type hinting
-                field = {k: try_parse_bool(v) for k, v in field.items()}
-
-                _name = field.pop("name")
-                _type = field.pop("type", None)
-                shape = field.pop("shape", None)
-                shape = None if shape == "" else shape
-                block = field.pop("block", None)
-                default = field.pop("default", None)
-                default = try_literal_eval(default) if _type != "string" else default
-                description = field.pop("description", "")
-                reader = field.pop("reader", "urword")
-
-                def _item() -> Field:
-                    """Load list item."""
-
-                    item_names = _type.split()[1:]
-                    item_types = [
-                        v["type"]
-                        for v in flat.values(multi=True)
-                        if v["name"] in item_names and v.get("in_record", False)
-                    ]
-                    n_item_names = len(item_names)
-                    if n_item_names < 1:
-                        raise ValueError(f"Missing list definition: {_type}")
-
-                    # explicit record
-                    if n_item_names == 1 and (
-                        item_types[0].startswith("record")
-                        or item_types[0].startswith("keystring")
-                    ):
-                        return _convert_field(next(iter(flat.getlist(item_names[0]))))
-
-                    # implicit simple record (no children)
-                    if all(t in SCALAR_TYPES for t in item_types):
-                        return Field(
-                            name=_name,
-                            type="record",
-                            block=block,
-                            children=_fields(),
-                            description=description.replace(
-                                "is the list of", "is the record of"
-                            ),
-                            reader=reader,
-                            **field,
-                        )
-
-                    # implicit complex record (has children)
-                    fields = {
-                        v["name"]: _convert_field(v)
-                        for v in flat.values(multi=True)
-                        if v["name"] in item_names and v.get("in_record", False)
-                    }
-                    first = next(iter(fields.values()))
-                    single = len(fields) == 1
-                    item_type = (
-                        "keystring"
-                        if single and "keystring" in first["type"]
-                        else "record"
-                    )
-                    return Field(
-                        name=first["name"] if single else _name,
-                        type=item_type,
-                        block=block,
-                        children=first["children"] if single else fields,
-                        description=description.replace(
-                            "is the list of", f"is the {item_type} of"
-                        ),
-                        reader=reader,
-                        **field,
-                    )
-
-                def _choices() -> Fields:
-                    """Load keystring (union) choices."""
-                    names = _type.split()[1:]
-                    return {
-                        v["name"]: _convert_field(v)
-                        for v in flat.values(multi=True)
-                        if v["name"] in names and v.get("in_record", False)
-                    }
-
-                def _fields() -> Fields:
-                    """Load record fields."""
-                    names = _type.split()[1:]
-                    fields = {}
-                    for name in names:
-                        v = flat.get(name, None)
-                        if (
-                            not v
-                            or not v.get("in_record", False)
-                            or v["type"].startswith("record")
-                        ):
-                            continue
-                        fields[name] = _convert_field(v)
-                    return fields
-
-                var_ = Field(
-                    name=_name,
-                    shape=shape,
-                    block=block,
-                    description=description,
-                    default=default,
-                    reader=reader,
-                    **field,
-                )
-
-                if _type.startswith("recarray"):
-                    item = _item()
-                    var_["children"] = {item["name"]: item}
-                    var_["type"] = "recarray"
-
-                elif _type.startswith("keystring"):
-                    var_["children"] = _choices()
-                    var_["type"] = "keystring"
-
-                elif _type.startswith("record"):
-                    var_["children"] = _fields()
-                    var_["type"] = "record"
-
-                # for now, we can tell a var is an array if its type
-                # is scalar and it has a shape. once we have proper
-                # typing, this can be read off the type itself.
-                elif shape is not None and _type not in SCALAR_TYPES:
-                    raise TypeError(f"Unsupported array type: {_type}")
-
-                else:
-                    var_["type"] = _type
-
-                return var_
-
-            return dict(sorted(_load(var).items(), key=field_attr_sort_key))
-
-        # load top-level fields. any nested
-        # fields will be loaded recursively
-        fields = {
-            field["name"]: _convert_field(field)
-            for field in flat.values(multi=True)
-            if not field.get("in_record", False)
-        }
-
-        # group variables by block
-        blocks = {
-            block_name: {v["name"]: v for v in block}
-            for block_name, block in groupby(fields.values(), lambda v: v["block"])
-        }
-
-        # extract distinct arrays from recarray-style definitions in all blocks
-        for block_name, block in blocks.items():
-            # Check if this block contains any recarray fields
-            has_recarray = any(field["type"] == "recarray" for field in block.values())
-            if has_recarray:
-                blocks[block_name] = _convert_recarray_block(block, block_name)
-
-        # remove unneeded variable attributes
-        def remove_attrs(path, key, value):
-            if key in ["in_record", "tagged", "preserve_case"]:
-                return False
-            return True
-
-        blocks = remap(blocks, visit=remove_attrs)
-
-        def _advanced() -> bool | None:
-            return any("package-type advanced" in m for m in meta)
-
-        def _multi() -> bool:
-            return any("multi-package" in m for m in meta)
-
-        def _sln() -> Sln | None:
-            sln = next(
-                iter(
-                    m
-                    for m in meta
-                    if isinstance(m, str) and m.startswith("solution_package")
-                ),
-                None,
-            )
-            if sln:
-                abbr, pattern = sln.split()[1:]
-                return Sln(abbr=abbr, pattern=pattern)
-            return None
-
-        def _sub() -> Ref | None:
-            def _parent():
-                line = next(
-                    iter(
-                        m for m in meta if isinstance(m, str) and m.startswith("parent")
-                    ),
-                    None,
-                )
-                if not line:
-                    return None
-                split = line.split()
-                return split[1]
-
-            def _rest():
-                line = next(
-                    iter(
-                        m for m in meta if isinstance(m, str) and m.startswith("subpac")
-                    ),
-                    None,
-                )
-                if not line:
-                    return None
-                _, key, abbr, param, val = line.split()
-                matches = [v for v in fields.values() if v["name"] == val]
-                if not any(matches):
-                    descr = None
-                else:
-                    if len(matches) > 1:
-                        warn(f"Multiple matches for referenced variable {val}")
-                    match = matches[0]
-                    descr = match["description"]
-
-                return {
-                    "key": key,
-                    "val": val,
-                    "abbr": abbr,
-                    "param": param,
-                    "description": descr,
-                }
-
-            parent = _parent()
-            rest = _rest()
-            if parent and rest:
-                return Ref(parent=parent, **rest)
-            return None
-
-        sln = _sln()
-        multi = (
-            _multi()
-            or sln is not None
-            or ("nam" in name and "sim" not in name)
-            or name.startswith("exg-")
-        )
-
-        return cls(
-            name=name,
-            advanced=_advanced(),
-            multi=multi,
-            sln=sln,
-            ref=_sub(),
-            **blocks,
-        )
-
-    @classmethod  # type: ignore[misc]
-    def _load_v2(cls, f, name) -> "Dfn":
-        data = tomli.load(f)
-        if name and name != data.get("name", None):
-            raise ValueError(f"Name mismatch, expected {name}")
-        return cls(**data)
-
-    @classmethod  # type: ignore[misc]
-    def load(
-        cls,
-        f,
-        name: str | None = None,
-        version: FormatVersion = 1,
-        **kwargs,
-    ) -> "Dfn":
-        """
-        Load a component definition from a definition file.
-        """
-
-        if version == 1:
-            return cls._load_v1(f, name, **kwargs)
-        elif version == 2:
-            return cls._load_v2(f, name)
-        else:
-            raise ValueError(f"Unsupported version, expected one of {version.__args__}")
-
-    @staticmethod  # type: ignore[misc]
-    def _load_all_v1(dfndir: PathLike) -> Dfns:
-        paths: list[Path] = [
-            p for p in dfndir.glob("*.dfn") if p.stem not in ["common", "flopy"]
-        ]
-
-        # load common variables
-        common_path: Path | None = dfndir / "common.dfn"
-        if not common_path.is_file:
-            common = None
-        else:
-            with common_path.open() as f:
-                common, _ = Dfn._load_v1_flat(f)
-
-        # load definitions
-        dfns: Dfns = {}
-        for path in paths:
-            with path.open() as f:
-                dfn = Dfn.load(f, name=path.stem, common=common)
-                dfns[path.stem] = dfn
-
-        return dfns
-
-    @staticmethod  # type: ignore[misc]
-    def _load_all_v2(dfndir: PathLike) -> Dfns:
-        paths: list[Path] = [
-            p for p in dfndir.glob("*.toml") if p.stem not in ["common", "flopy"]
-        ]
-        dfns: Dfns = {}
-        for path in paths:
-            with path.open(mode="rb") as f:
-                dfn = Dfn.load(f, name=path.stem, version=2)
-                dfns[path.stem] = dfn
-
-        return dfns
-
-    @staticmethod  # type: ignore[misc]
-    def load_all(dfndir: PathLike, version: FormatVersion = 1) -> Dfns:
-        """Load all component definitions from the given directory."""
-        if version == 1:
-            return Dfn._load_all_v1(dfndir)
-        elif version == 2:
-            return Dfn._load_all_v2(dfndir)
-        else:
-            raise ValueError(f"Unsupported version, expected one of {version.__args__}")
-
-    @staticmethod  # type: ignore[misc]
-    def load_tree(dfndir: PathLike, version: FormatVersion = 2) -> dict:
-        """Load all definitions and return as hierarchical tree."""
-        dfns = Dfn.load_all(dfndir, version)
-        return infer_tree(dfns)
-
-
-def infer_tree(dfns: dict[str, Dfn]) -> dict:
-    """Infer the component hierarchy from definitions.
-
-    Enforces single root requirement - must be exactly one component
-    with no parent, and it must be named 'sim'.
-    """
-    roots = [name for name, dfn in dfns.items() if not dfn.get("parent")]
-
-    if len(roots) != 1:
-        raise ValueError(
-            f"Expected exactly one root component, found {len(roots)}: {roots}"
-        )
-
-    root_name = roots[0]
-    if root_name != "sim":
-        raise ValueError(f"Root component must be named 'sim', found '{root_name}'")
-
-    def add_children(node_name: str) -> dict[str, Any]:
-        node = dict(dfns[node_name])
-        children = [
-            name for name, dfn in dfns.items() if dfn.get("parent") == node_name
-        ]
-        for child in children:
-            node[child] = add_children(child)
-        return node
-
-    return {root_name: add_children(root_name)}
-
-
-def get_dfns(
-    owner: str, repo: str, ref: str, outdir: str | PathLike, verbose: bool = False
-):
-    """Fetch definition files from the MODFLOW 6 repository."""
-    url = f"https://github.com/{owner}/{repo}/archive/{ref}.zip"
-    if verbose:
-        print(f"Downloading MODFLOW 6 repository from {url}")
-    with tempfile.TemporaryDirectory() as tmp:
-        dl_path = download_and_unzip(url, Path(tmp), verbose=verbose)
-        contents = list(dl_path.glob("modflow6-*"))
-        proj_path = next(iter(contents), None)
-        if not proj_path:
-            raise ValueError(f"Missing proj dir in {dl_path}, found {contents}")
-        if verbose:
-            print("Copying dfns from download dir to output dir")
-        shutil.copytree(
-            proj_path / "doc" / "mf6io" / "mf6ivar" / "dfn", outdir, dirs_exist_ok=True
-        )
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
new file mode 100644
index 00000000..51bf5b2c
--- /dev/null
+++ b/modflow_devtools/dfn/__init__.py
@@ -0,0 +1,459 @@
+"""
+MODFLOW 6 definition file tools.
+"""
+
+from abc import ABC, abstractmethod
+from dataclasses import asdict, dataclass, replace
+from itertools import groupby
+from os import PathLike
+from pathlib import Path
+from typing import (
+    Literal,
+)
+
+import tomli
+from boltons.dictutils import OMD
+from boltons.iterutils import remap
+from packaging.version import Version
+
+import modflow_devtools.dfn.schema.v1 as v1_schema
+from modflow_devtools.dfn.parse import (
+    is_advanced_package,
+    is_multi_package,
+    parse_dfn,
+    try_parse_bool,
+    try_parse_parent,
+)
+from modflow_devtools.dfn.schema.block import Block, Blocks
+from modflow_devtools.dfn.schema.field import SCALAR_TYPES, Field, Fields
+from modflow_devtools.dfn.schema.ref import Ref
+from modflow_devtools.dfn.schema.v1 import FieldV1
+from modflow_devtools.dfn.schema.v2 import FieldV2
+from modflow_devtools.misc import try_literal_eval
+
+Format = Literal["dfn", "toml"]
+"""DFN serialization format."""
+
+
+Dfns = dict[str, "Dfn"]
+
+
+@dataclass
+class Dfn:
+    """
+    Definition of a single MODFLOW 6 input component.
+
+    Holds the component's name and the schema version of the definition,
+    and optionally its parent's name, a reference, its blocks of fields
+    and its child components.
+    """
+
+    name: str
+    schema_version: Version
+    parent: str | None = None
+    advanced: bool = False
+    multi: bool = False
+    ref: Ref | None = None
+    blocks: Blocks | None = None
+    children: Dfns | None = None
+
+    @property
+    def fields(self) -> Fields:
+        """
+        The top-level fields of all blocks, gathered into one ordered
+        multi-dict keyed by field name.
+
+        Subfields nested in records or recarrays are not included. A name
+        occurring in several blocks yields one entry per occurrence.
+        """
+        blocks = self.blocks if self.blocks else {}
+        pairs = [
+            (field.name, field)
+            for block in blocks.values()
+            for field in block.values()
+        ]
+        return OMD(pairs)
+
+
+class SchemaMap(ABC):
+    """Interface for converting a definition between schema versions."""
+
+    @abstractmethod
+    def map(self, dfn: Dfn) -> Dfn:
+        """Return the given definition converted by this mapping."""
+
+
+class MapV1To2(SchemaMap):
+    @staticmethod
+    def map_period_block(dfn: Dfn, block: Block) -> Block:
+        """
+        Convert a period block recarray to individual arrays, one per column.
+
+        Extracts recarray fields and creates separate array variables. Gives
+        each an appropriate grid- or tdis-aligned shape as opposed to sparse
+        list shape in terms of maxbound as previously.
+
+        Parameters
+        ----------
+        dfn : Dfn
+            The definition the block belongs to. Currently unused.
+        block : Block
+            The period block's fields by name. The mapping is copied,
+            not modified.
+
+        Returns
+        -------
+        Block
+            The block's columns by name, each with a shape of `nper`, then
+            `nnodes` if the block has a `cellid` column, then the column's
+            own dimensions except `maxbound`. The `cellid` column and the
+            recarray itself are dropped.
+        """
+
+        block = dict(block)
+        fields = list(block.values())
+        if not fields:
+            # an empty block has nothing to convert
+            return block
+        if fields[0].type == "recarray":
+            assert len(fields) == 1
+            recarray_name = fields[0].name
+            block.pop(recarray_name, None)
+            # the recarray's first child is its row; the row's children
+            # are the columns
+            item = next(iter((fields[0].children or {}).values()), None)
+            columns = dict(item.children or {}) if item is not None else {}
+        else:
+            columns = block
+
+        cellid = columns.pop("cellid", None)
+        # iterate over a snapshot, since `columns` may be `block` itself
+        for col_name, column in list(columns.items()):
+            # drop the enclosing parentheses, then the whitespace around
+            # each dimension name, so "maxbound" is recognized wherever
+            # it appears in the list
+            old_dims = [dim.strip() for dim in (column.shape or "")[1:-1].split(",")]
+            new_dims = ["nper"]
+            if cellid:
+                new_dims.append("nnodes")
+            new_dims.extend(dim for dim in old_dims if dim and dim != "maxbound")
+            block[col_name] = replace(column, shape=f"({', '.join(new_dims)})")
+
+        return block
+
+    @staticmethod
+    def map_field(dfn: Dfn, field: Field) -> Field:
+        """
+        Convert an input field specification from its representation
+        in a v1 format definition file to the v2 (structured) format.
+
+        Parameters
+        ----------
+        dfn : Dfn
+            The v1 definition the field belongs to. Its fields are
+            searched for the items of composite fields.
+        field : Field
+            The v1 field to convert.
+
+        Returns
+        -------
+        Field
+            The converted field, with `children` populated if it is
+            a recarray, keystring or record.
+
+        Raises
+        ------
+        ValueError
+            If the field has no type, or a recarray names no items.
+        TypeError
+            If the field has a shape but its type is not a scalar type.
+
+        Notes
+        -----
+        Attribute values are passed through `try_parse_bool`, and the
+        default value through `try_literal_eval` unless the field's
+        type is `string`.
+        """
+
+        fields = dfn.fields
+
+        def _map_field(_field) -> Field:
+            # keep the attribute dict under its own name: the closures
+            # below unpack it after the converted field has been created
+            attrs = asdict(_field)
+            # parse booleans from strings. everything else can
+            # stay a string except default values, which we'll
+            # try to parse as arbitrary literals below, and at
+            # some point types, once we introduce type hinting
+            attrs = {k: try_parse_bool(v) for k, v in attrs.items()}
+            _name = attrs.pop("name")
+            _type = attrs.pop("type", None)
+            if _type is None:
+                raise ValueError(f"Field '{_name}' has no type")
+            shape = attrs.pop("shape", None)
+            shape = None if shape == "" else shape
+            block = attrs.pop("block", None)
+            default = attrs.pop("default", None)
+            default = try_literal_eval(default) if _type != "string" else default
+            description = attrs.pop("description", "")
+
+            def _row_field() -> Field:
+                """Parse a table's record (row) field"""
+                item_names = _type.split()[1:]
+                item_types = [
+                    f.type
+                    for f in fields.values(multi=True)
+                    if f.name in item_names and f.in_record
+                ]
+                n_item_names = len(item_names)
+                if n_item_names < 1:
+                    raise ValueError(f"Missing list definition: {_type}")
+
+                # explicit record or keystring
+                if (
+                    n_item_names == 1
+                    and item_types
+                    and item_types[0].startswith(("record", "keystring"))
+                ):
+                    return MapV1To2.map_field(
+                        dfn, next(iter(fields.getlist(item_names[0])))
+                    )
+
+                # implicit record with all scalar fields
+                if all(t in SCALAR_TYPES for t in item_types):
+                    return FieldV2.from_dict(
+                        {
+                            # leftover attributes go first so the
+                            # explicit entries below take precedence
+                            **attrs,
+                            "name": _name,
+                            "type": "record",
+                            "block": block,
+                            "children": _record_fields(),
+                            "description": (description or "").replace(
+                                "is the list of", "is the record of"
+                            ),
+                        }
+                    )
+
+                # implicit record with composite fields
+                children = {
+                    f.name: MapV1To2.map_field(dfn, f)
+                    for f in fields.values(multi=True)
+                    if f.name in item_names and f.in_record
+                }
+                first = next(iter(children.values()))
+                single = len(children) == 1
+                item_type = (
+                    "keystring" if single and "keystring" in first.type else "record"
+                )
+                return FieldV2.from_dict(
+                    {
+                        **attrs,
+                        "name": first.name if single else _name,
+                        "type": item_type,
+                        "block": block,
+                        "children": first.children if single else children,
+                        "description": (description or "").replace(
+                            "is the list of", f"is the {item_type} of"
+                        ),
+                    }
+                )
+
+            def _union_fields() -> Fields:
+                """Parse a union's fields"""
+                names = _type.split()[1:]
+                return {
+                    f.name: MapV1To2.map_field(dfn, f)
+                    for f in fields.values(multi=True)
+                    if f.name in names and f.in_record
+                }
+
+            def _record_fields() -> Fields:
+                """Parse a record's fields"""
+                names = _type.split()[1:]
+                children = {}
+                for name in names:
+                    # look the item up among the definition's fields
+                    child = fields.get(name, None)
+                    if (
+                        not child
+                        or not child.in_record
+                        or (child.type or "").startswith("record")
+                    ):
+                        continue
+                    children[name] = _map_field(child)
+                return children
+
+            # the type is required to construct the field; composite
+            # types are replaced with their short names below
+            mapped = FieldV2.from_dict(
+                {
+                    **attrs,
+                    "name": _name,
+                    "type": _type,
+                    "shape": shape,
+                    "block": block,
+                    "description": description,
+                    "default": default,
+                }
+            )
+
+            if _type.startswith("recarray"):
+                child = _row_field()
+                mapped.children = {child.name: child}
+                mapped.type = "recarray"
+
+            elif _type.startswith("keystring"):
+                mapped.children = _union_fields()
+                mapped.type = "keystring"
+
+            elif _type.startswith("record"):
+                mapped.children = _record_fields()
+                mapped.type = "record"
+
+            # for now, we can tell a var is an array if its type
+            # is scalar and it has a shape. once we have proper
+            # typing, this can be read off the type itself.
+            elif shape is not None and _type not in SCALAR_TYPES:
+                raise TypeError(f"Unsupported array type: {_type}")
+
+            return mapped
+
+        return _map_field(field)
+
+    @staticmethod
+    def map_blocks(dfn: Dfn) -> Blocks:
+        """
+        Convert the blocks of a v1 definition to the v2 schema.
+
+        Every field of the definition that is not part of a record is
+        converted with `map_field` and filed under the name of its block.
+        A block named `period`, if any, is then converted with
+        `map_period_block`.
+        """
+        fields = {
+            field.name: MapV1To2.map_field(dfn, field)
+            for field in dfn.fields.values(multi=True)
+            if not field.in_record
+        }
+        # group explicitly rather than with itertools.groupby, which only
+        # groups adjacent items: a block whose fields are not contiguous
+        # would otherwise keep only its last run of fields
+        blocks: dict = {}
+        for mapped in fields.values():
+            blocks.setdefault(mapped.block, {})[mapped.name] = mapped
+        if (period_block := blocks.get("period", None)) is not None:
+            blocks["period"] = MapV1To2.map_period_block(dfn, period_block)
+
+        def remove_attrs(path, key, value):
+            # remove unneeded variable attributes
+            if key in ["in_record", "tagged", "preserve_case"]:
+                return False
+            return True
+
+        return remap(blocks, visit=remove_attrs)
+
+    def map(self, dfn: Dfn) -> Dfn:
+        """
+        Convert a definition to schema version 2.
+
+        A definition already at version 2 is returned as is. Otherwise
+        a new definition is returned with converted blocks.
+        """
+        if dfn.schema_version == Version("2"):
+            return dfn
+        return Dfn(
+            name=dfn.name,
+            # required by Dfn, and what marks the result as converted
+            schema_version=Version("2"),
+            parent=dfn.parent,
+            advanced=dfn.advanced,
+            multi=dfn.multi,
+            ref=dfn.ref,
+            blocks=MapV1To2.map_blocks(dfn),
+        )
+
+
+def map(
+    dfn: Dfn,
+    schema_version: str | Version = "2",
+) -> Dfn:
+    """
+    Map a MODFLOW 6 specification to another schema version.
+
+    Parameters
+    ----------
+    dfn : Dfn
+        The definition to convert.
+    schema_version : str | Version
+        The schema version to convert to, by default "2".
+
+    Returns
+    -------
+    Dfn
+        The given definition if it already has the target version,
+        otherwise a converted definition.
+
+    Raises
+    ------
+    NotImplementedError
+        If the target version is 1 and the definition is not.
+    ValueError
+        If the target version is neither 1 nor 2.
+    """
+    # normalize first: a Version never compares equal to a plain string,
+    # and Version() itself only accepts strings
+    target = Version(str(schema_version))
+    if dfn.schema_version == target:
+        return dfn
+    if target == Version("1"):
+        raise NotImplementedError("Mapping to schema version 1 is not implemented yet.")
+    if target == Version("2"):
+        return MapV1To2().map(dfn)
+    raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
+
+
+def load(f: str | PathLike, **kwargs) -> Dfn:
+    """
+    Load a MODFLOW 6 definition file.
+
+    Parameters
+    ----------
+    f : str | PathLike
+        Path to a `.dfn` or `.toml` file.
+    **kwargs
+        Passed to `parse_dfn` when loading a `.dfn` file.
+
+    Returns
+    -------
+    Dfn
+        The definition. One loaded from a `.dfn` file is named after
+        the file and has schema version 1; it has no blocks if the
+        file name contains "common".
+
+    Raises
+    ------
+    ValueError
+        If the file has neither a `.dfn` nor a `.toml` suffix.
+    """
+    path = Path(f).expanduser().resolve()
+    if path.suffix == ".dfn":
+        fields, meta = parse_dfn(path, **kwargs)
+        blocks: dict = {}
+        if "common" not in path.stem:
+            # visit every entry, including fields whose name is repeated
+            # in another block, and group explicitly: itertools.groupby
+            # only groups adjacent items, so a block interrupted by a
+            # field of another block would lose its earlier fields
+            for field in fields.values(multi=True):
+                block = blocks.setdefault(field["block"], {})
+                block[field["name"]] = FieldV1.from_dict(field)
+        return Dfn(
+            name=path.stem,
+            schema_version=Version("1"),
+            parent=try_parse_parent(meta),
+            advanced=is_advanced_package(meta),
+            multi=is_multi_package(meta),
+            blocks=blocks,
+        )
+    if path.suffix == ".toml":
+        with path.open("rb") as file:
+            return Dfn(**tomli.load(file))
+    raise ValueError(
+        f"Unsupported definition file suffix '{path.suffix}', "
+        "expected '.dfn' or '.toml'"
+    )
+
+
+def _load_common(path: str | PathLike) -> Fields:
+    """
+    Parse the common variable definitions in the file at the given path.
+
+    Returns an empty dict if there is no file at that path.
+    """
+    resolved = Path(path).expanduser().resolve()
+    if resolved.is_file():
+        definitions, _meta = parse_dfn(resolved)
+        return definitions
+    return {}
+
+
+def load_all(dfndir: str | PathLike) -> Dfns:
+    """
+    Load a MODFLOW 6 specification from definition files in a directory.
+
+    If the directory has any `.dfn` files these are loaded, with common
+    variable definitions taken from `common.dfn` if it exists. Otherwise
+    any `.toml` files are loaded. Files named `common` or `flopy` are
+    not loaded as definitions.
+
+    Returns
+    -------
+    Dfns
+        The definitions by file name (without suffix); empty if the
+        directory has no definition files.
+    """
+    exclude = ["common", "flopy"]
+    dfndir = Path(dfndir).expanduser().resolve()
+    dfns = {p.stem: p for p in dfndir.glob("*.dfn") if p.stem not in exclude}
+    if dfns:
+        common = _load_common(dfndir / "common.dfn")
+        return {path.stem: load(path, common=common) for path in dfns.values()}
+    tomls = {p.stem: p for p in dfndir.glob("*.toml") if p.stem not in exclude}
+    if tomls:
+        return {path.stem: load(path) for path in tomls.values()}
+    # nothing to load: return an empty spec, as annotated, not None
+    return {}
+
+
+def infer_tree(dfns: Dfns) -> Dfn:
+    """
+    Infer the MODFLOW 6 input component hierarchy from a flat spec:
+    unlinked DFNs, i.e. without `children` populated, only `parent`.
+
+    Returns the root component with children filled.
+    There must be exactly one root, i.e. component with no `parent`.
+
+    Assumes all DFNs are of the same schema version.
+
+    Components are renamed and assigned parents by name:
+    `sim-nam` becomes `sim`; `<model>-nam` becomes `<model>` with parent
+    `sim`; `exg-*`, `sln-*` and `utl-*` get parent `sim`; any other
+    `<model>-*` gets parent `<model>`. Other components are unchanged.
+    The given definitions are not modified.
+
+    Raises
+    ------
+    NotImplementedError
+        If the definitions have schema version 1. This is also the
+        case if `dfns` is empty, since version 1 is then assumed.
+    ValueError
+        If there is not exactly one root component, or the schema
+        version is neither 1 nor 2.
+    """
+
+    def add_parent(dfn: Dfn) -> Dfn:
+        # definitions are dataclasses: derive modified copies
+        # with `replace` instead of changing the caller's objects
+        dfn_name = dfn.name
+        if dfn_name == "sim-nam":
+            # simulation name file
+            return replace(dfn, name="sim")
+        if dfn_name.endswith("-nam"):
+            # model name files; strip the "-nam" suffix
+            return replace(dfn, name=dfn_name[:-4], parent="sim")
+        if dfn_name.startswith(("exg-", "sln-", "utl-")):
+            # exchanges, solutions, standalone utilities
+            return replace(dfn, parent="sim")
+        if "-" in dfn_name:
+            # packages
+            return replace(dfn, parent=dfn_name.split("-")[0])
+        return dfn
+
+    first = next(iter(dfns.values()), None)
+    schema_version = first.schema_version if first else Version("1")
+
+    if schema_version == Version("1"):
+        raise NotImplementedError("Structure inference from v1 schema not implemented")
+    if schema_version != Version("2"):
+        raise ValueError(
+            f"Unsupported schema version: {schema_version}. Expected 1 or 2."
+        )
+
+    # key components by their new names, since these
+    # are the names parents are referred to by
+    nodes = {node.name: node for node in (add_parent(d) for d in dfns.values())}
+    roots = [name for name, node in nodes.items() if node.parent is None]
+    if len(roots) != 1:
+        raise ValueError(f"Expected one root component, found {len(roots)}")
+
+    def get_children(node_name: str) -> Dfns:
+        # link recursively so grandchildren are attached as well
+        return {
+            name: replace(node, children=get_children(name))
+            for name, node in nodes.items()
+            if node.parent == node_name
+        }
+
+    root_name = roots[0]
+    return replace(nodes[root_name], children=get_children(root_name))
+
+
+def load_tree(dfndir: str | PathLike) -> Dfn:
+    """
+    Load the definition files in a directory as a structured
+    MODFLOW 6 specification.
+
+    The definitions are loaded with `load_all` and linked with
+    `infer_tree`, whose result, the single root component (the
+    simulation) with its children filled, is returned.
+    """
+    flat_spec = load_all(dfndir)
+    return infer_tree(flat_spec)
+
+
+__all__ = [
+    "SCALAR_TYPES",
+    "Block",
+    "Blocks",
+    "Dfn",
+    "Dfns",
+    "Field",
+    "FieldV1",
+    "FieldV2",
+    "Fields",
+    "Ref",
+    "infer_tree",
+    "load",
+    "load_all",
+    "load_tree",
+    "map",
+]
diff --git a/modflow_devtools/dfn/fetch.py b/modflow_devtools/dfn/fetch.py
new file mode 100644
index 00000000..34cdfa76
--- /dev/null
+++ b/modflow_devtools/dfn/fetch.py
@@ -0,0 +1,29 @@
+from os import PathLike
+from pathlib import Path
+from shutil import copytree
+from tempfile import TemporaryDirectory
+
+from modflow_devtools.download import download_and_unzip
+
+
+def fetch_dfns(
+    owner: str, repo: str, ref: str, outdir: str | PathLike, verbose: bool = False
+):
+    """
+    Fetch definition files from the MODFLOW 6 repository.
+
+    Downloads and unzips an archive of the repository to a temporary
+    directory, then copies the project's `doc/mf6io/mf6ivar/dfn`
+    directory into the output directory, which may already exist.
+
+    Parameters
+    ----------
+    owner : str
+        The GitHub user or organization owning the repository.
+    repo : str
+        The repository's name.
+    ref : str
+        The git ref to download an archive of.
+    outdir : str | PathLike
+        The directory to copy definition files to.
+    verbose : bool
+        Whether to print progress messages, by default False.
+
+    Raises
+    ------
+    ValueError
+        If no project directory is found in the unzipped archive.
+    """
+    url = f"https://github.com/{owner}/{repo}/archive/{ref}.zip"
+    if verbose:
+        print(f"Downloading MODFLOW 6 repository archive from {url}")
+    with TemporaryDirectory() as tmp:
+        dl_path = download_and_unzip(url, Path(tmp), verbose=verbose)
+        # look for a directory named after the requested repository
+        # (presumably how GitHub names an archive's top-level directory
+        # -- TODO confirm), then fall back to the previous fixed pattern
+        contents = list(dl_path.glob(f"{repo}-*"))
+        if not contents:
+            contents = list(dl_path.glob("modflow6-*"))
+        proj_path = next(iter(contents), None)
+        if not proj_path:
+            raise ValueError(f"Missing proj dir in {dl_path}, found {contents}")
+        if verbose:
+            print("Copying dfns from download dir to output dir")
+        copytree(
+            proj_path / "doc" / "mf6io" / "mf6ivar" / "dfn", outdir, dirs_exist_ok=True
+        )
+
+
+get_dfns = fetch_dfns  # alias for backward compatibility
diff --git a/modflow_devtools/dfn/parse.py b/modflow_devtools/dfn/parse.py
new file mode 100644
index 00000000..589bdb29
--- /dev/null
+++ b/modflow_devtools/dfn/parse.py
@@ -0,0 +1,182 @@
+from ast import literal_eval
+from os import PathLike
+from pathlib import Path
+from typing import Any
+from warnings import warn
+
+from boltons.dictutils import OMD
+
+
+def field_attr_sort_key(item) -> int:
+    """
+    Sort key for `(name, value)` items of an input field's attributes.
+
+    Known attributes sort in this order, starting from -1:
+    block, name, type, shape, default, reader, optional, longname,
+    description. Any other attribute sorts after them, with key 8.
+    """
+
+    ordered = (
+        "block",
+        "name",
+        "type",
+        "shape",
+        "default",
+        "reader",
+        "optional",
+        "longname",
+        "description",
+    )
+    attr_name, _ = item
+    for rank, known in enumerate(ordered, start=-1):
+        if attr_name == known:
+            return rank
+    return 8
+
+
+def try_parse_bool(value: Any) -> Any:
+    """
+    Try to parse a boolean from a string as represented
+    in a DFN file, otherwise return the value unaltered.
+    1. `"true"` -> `True`
+    2. `"false"` -> `False`
+    3. anything else -> `value`
+
+    Strings are matched regardless of case.
+    """
+    if isinstance(value, str):
+        # compare a lowered copy, so that any other string
+        # is returned with its original case intact
+        lowered = value.lower()
+        if lowered in ("true", "false"):
+            return lowered == "true"
+    return value
+
+
+def try_parse_parent(meta: list[str]) -> str | None:
+    """
+    Try to parse a component's parent component name from its metadata.
+    Return `None` if it has no parent specified.
+
+    The first metadata string starting with "parent" is used, and
+    its second whitespace-separated token is returned. `None` is
+    returned if that string has no second token.
+    """
+    for entry in meta:
+        if isinstance(entry, str) and entry.startswith("parent"):
+            tokens = entry.split()
+            # a bare "parent" with no value specifies no parent
+            return tokens[1] if len(tokens) > 1 else None
+    return None
+
+
+def is_advanced_package(meta: list[str]) -> bool:
+    """
+    Tell from a component's metadata whether it is an advanced package,
+    i.e. whether any entry contains "package-type advanced".
+    """
+    marker = "package-type advanced"
+    for entry in meta:
+        if marker in entry:
+            return True
+    return False
+
+
+def is_multi_package(meta: list[str]) -> bool:
+    """
+    Tell from a component's metadata whether it is a multi-package,
+    i.e. whether any entry contains "multi-package".
+    """
+    marker = "multi-package"
+    for entry in meta:
+        if marker in entry:
+            return True
+    return False
+
+
+def parse_dfn(
+    path: str | PathLike,
+    common: dict | None = None,
+) -> tuple[OMD, list[str]]:
+    """
+    Parse a DFN file into an ordered dict of fields and a list of metadata.
+
+    Parameters
+    ----------
+    path : str | PathLike
+        Path to the DFN file to parse.
+    common : dict, optional
+        A dictionary of common variable definitions to use for
+        description substitutions, by default None.
+
+    Returns
+    -------
+    tuple[OMD, list[str]]
+        A tuple containing an ordered multi-dict of fields and a list of metadata.
+
+    Notes
+    -----
+    A DFN file consists of field definitions (each as a set of attributes) and a
+    number of comment lines either a) containing metadata about the component or
+    b) delimiting variables into blocks. This parser reads the file line-by-line
+    and saves component metadata and field attributes, ignoring block delimiters;
+    There is a `block` attribute on each field anyway so delimiters are unneeded.
+
+    The returned ordered multi-dict (OMD) maps names to dicts of their attributes,
+    with duplicate field names allowed. This is important because some DFN files
+    have fields with the same name defined multiple times for different purposes
+    (e.g., an `auxiliary` options block keyword, and column in the period block).
+
+    A description containing `REPLACE <name> <substitutions>` is replaced
+    with the description of the common variable `<name>`, in which each key of
+    the substitutions (a dict literal) is replaced with its value. A warning is
+    issued, and the description kept, if there is no such common variable.
+
+    """
+
+    common = common or {}
+    field: dict = {}
+    fields: list = []
+    metadata: list = []
+
+    # open the file in a context manager so that it is closed
+    # as soon as parsing finishes, or fails
+    with Path(path).expanduser().resolve().open() as file:
+        for line in file:
+            # parse metadata line
+            if (line := line.strip()).startswith("#"):
+                _, sep, tail = line.partition("flopy")
+                if sep == "flopy":
+                    if (
+                        "multi-package" in tail
+                        or "solution_package" in tail
+                        or "subpackage" in tail
+                        or "parent" in tail
+                    ):
+                        metadata.append(tail.strip())
+                _, sep, tail = line.partition("package-type")
+                if sep == "package-type":
+                    metadata.append(f"package-type {tail.strip()}")
+                continue
+
+            # if we hit a newline and the field has attributes,
+            # we've reached the end of the field. Save it.
+            if not line:
+                if field:
+                    fields.append((field["name"], field))
+                    field = {}
+                continue
+
+            # parse field attribute
+            key, _, value = line.partition(" ")
+            if key == "default_value":
+                key = "default"
+            field[key] = value
+
+            # if this is the description attribute, substitute
+            # from common variable definitions if needed. drop
+            # backslashes too, TODO: generate/insert citations.
+            if key == "description":
+                descr = value.replace("\\", "").replace("``", "'").replace("''", "'")
+                _, marker, tail = descr.strip().partition("REPLACE")
+                if marker:
+                    common_name, _, subs_text = tail.strip().partition(" ")
+                    # no substitutions given means nothing to substitute
+                    subs = literal_eval(subs_text) if subs_text.strip() else {}
+                    cmmn = common.get(common_name, None)
+                    if cmmn is None:
+                        warn(
+                            "Can't substitute description text, "
+                            f"common variable not found: {common_name}"
+                        )
+                    else:
+                        descr = cmmn["description"]
+                        if subs:
+                            descr = descr.replace("\\", "")
+                            # apply every substitution, not only "{#1}"
+                            for placeholder, text in subs.items():
+                                descr = descr.replace(placeholder, text)
+                field["description"] = descr
+
+    # Save the last field if needed.
+    if field:
+        fields.append((field["name"], field))
+
+    return OMD(fields), metadata
diff --git a/modflow_devtools/dfn/schema/block.py b/modflow_devtools/dfn/schema/block.py
new file mode 100644
index 00000000..ed0f32af
--- /dev/null
+++ b/modflow_devtools/dfn/schema/block.py
@@ -0,0 +1,22 @@
+from collections.abc import Mapping
+
+from modflow_devtools.dfn.schema.field import Fields
+
+Block = Fields
+Blocks = Mapping[str, Block]
+
+
+def block_sort_key(item) -> int:
+    """
+    Sort key for `(name, block)` items.
+
+    Blocks named options, dimensions, griddata and packagedata sort
+    first, in that order (keys 0 to 3), then blocks whose name contains
+    "period" (key 4), then any other block (key 5).
+    """
+    block_name, _ = item
+    leading = ("options", "dimensions", "griddata", "packagedata")
+    for rank, known in enumerate(leading):
+        if block_name == known:
+            return rank
+    return 4 if "period" in block_name else 5
diff --git a/modflow_devtools/dfn/schema/field.py b/modflow_devtools/dfn/schema/field.py
new file mode 100644
index 00000000..f5ae8702
--- /dev/null
+++ b/modflow_devtools/dfn/schema/field.py
@@ -0,0 +1,39 @@
+from collections.abc import Mapping
+from dataclasses import dataclass
+from typing import Any, Literal
+
+SCALAR_TYPES = ("keyword", "integer", "double precision", "string")
+
+Fields = Mapping[str, "Field"]
+
+FieldType = Literal[
+    "keyword",
+    "integer",
+    "double precision",
+    "string",
+    "record",
+    "recarray",
+    "keystring",
+]
+
+
+Reader = Literal[
+    "urword",
+    "u1ddbl",
+    "u2ddbl",
+    "readarray",
+]
+
+
+@dataclass(kw_only=True)
+class Field:
+    """
+    Base specification of an input field.
+
+    All attributes are keyword-only and have defaults.
+    """
+
+    name: str | None = None
+    type: FieldType | None = None
+    # name of the block the field belongs to
+    block: str | None = None
+    default: Any | None = None
+    description: str | None = None
+    # subfields by name; presumably only set for composite
+    # fields (records, recarrays, keystrings) -- TODO confirm
+    children: Fields | None = None
+    optional: bool | None = None
+    reader: Reader = "urword"
+    # presumably a parenthesized, comma-separated list of
+    # dimensions, e.g. "(nper, nnodes)" -- TODO confirm
+    shape: str | None = None
+    valid: tuple[str, ...] | None = None
diff --git a/modflow_devtools/dfn/schema/ref.py b/modflow_devtools/dfn/schema/ref.py
new file mode 100644
index 00000000..e9306a2f
--- /dev/null
+++ b/modflow_devtools/dfn/schema/ref.py
@@ -0,0 +1,13 @@
+from dataclasses import dataclass
+
+
+@dataclass
+class Ref:
+    """
+    A foreign-key-like reference between a file input variable
+    in a referring input component and another input component
+    referenced by it.
+
+    Attributes
+    ----------
+    key : str
+        Name of the file path field in the referring component.
+    tgt : str
+        Name of the target component.
+    """
+
+    key: str  # name of file path field in referring component
+    tgt: str  # name of target component
diff --git a/modflow_devtools/dfn/schema/v1.py b/modflow_devtools/dfn/schema/v1.py
new file mode 100644
index 00000000..2d128594
--- /dev/null
+++ b/modflow_devtools/dfn/schema/v1.py
@@ -0,0 +1,22 @@
+from dataclasses import dataclass
+
+from modflow_devtools.dfn.schema.field import Field
+
+
+@dataclass(kw_only=True)
+class FieldV1(Field):
+    """
+    Input field specification in schema version 1.
+
+    Extends the base field with attributes specific to this version.
+    """
+
+    valid: tuple[str, ...] | None = None
+    tagged: bool | None = None
+    in_record: bool | None = None
+    layered: bool | None = None
+    longname: str | None = None
+    preserve_case: bool | None = None
+    numeric_index: bool | None = None
+    deprecated: bool = False
+    removed: bool = False
+    mf6internal: str | None = None
+
+    @classmethod
+    def from_dict(cls, d: dict) -> "FieldV1":
+        """
+        Create a FieldV1 instance from a dictionary.
+
+        Entries whose key is not the name of a field of the class,
+        including fields inherited from `Field`, are ignored.
+        """
+        # imported here to leave the module's imports untouched
+        from dataclasses import fields
+
+        # `cls.__annotations__` only lists attributes declared on the
+        # class itself, which would drop inherited ones such as `name`,
+        # `type` and `block`; `fields()` includes inherited fields too
+        names = {f.name for f in fields(cls)}
+        return cls(**{k: v for k, v in d.items() if k in names})
diff --git a/modflow_devtools/dfn/schema/v2.py b/modflow_devtools/dfn/schema/v2.py
new file mode 100644
index 00000000..f198a748
--- /dev/null
+++ b/modflow_devtools/dfn/schema/v2.py
@@ -0,0 +1,18 @@
+from dataclasses import dataclass
+from typing import Literal
+
+from modflow_devtools.dfn.schema.field import Field
+
+FieldType = Literal[
+    "keyword", "integer", "double", "string", "array", "record", "union"
+]
+
+
+@dataclass(kw_only=True)
+class FieldV2(Field):
+    """
+    Input field specification in schema version 2.
+
+    Unlike the base field, the type is required.
+    """
+
+    type: FieldType
+
+    @classmethod
+    def from_dict(cls, d: dict) -> "FieldV2":
+        """
+        Create a FieldV2 instance from a dictionary.
+
+        Entries whose key is not the name of a field of the class,
+        including fields inherited from `Field`, are ignored.
+        """
+        # imported here to leave the module's imports untouched
+        from dataclasses import fields
+
+        # `cls.__annotations__` only lists attributes declared on the
+        # class itself, i.e. just `type`, which would drop everything
+        # else; `fields()` includes inherited fields too
+        names = {f.name for f in fields(cls)}
+        return cls(**{k: v for k, v in d.items() if k in names})
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index 7d346e6d..aebb0189 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -1,74 +1,35 @@
 """Convert DFNs to TOML."""
 
 import argparse
+from dataclasses import asdict
 from os import PathLike
 from pathlib import Path
 
 import tomli_w as tomli
-from boltons.iterutils import remap
 
-from modflow_devtools.dfn import Dfn
+from modflow_devtools.dfn import load_all, map
 
 # mypy: ignore-errors
 
 
-def convert(indir: PathLike, outdir: PathLike):
+def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> None:
+    """
+    Convert the definition files in a directory to TOML files.
+
+    Definitions are loaded from `indir`, mapped to the given schema
+    version and each written to `<name>.toml` in `outdir`, which is
+    created if needed. Unset or empty attributes are not written.
+    """
     indir = Path(indir).expanduser().absolute()
     outdir = Path(outdir).expanduser().absolute()
     outdir.mkdir(exist_ok=True, parents=True)
-    for dfn in Dfn.load_all(indir).values():
-        dfn_name = dfn["name"]
-
-        # Determine new filename and parent relationship
-        if dfn_name == "sim-nam":
-            filename = "sim.toml"
-            dfn = dfn.copy()
-            dfn["name"] = "sim"
-            # No parent - this is root
-        elif dfn_name.endswith("-nam"):
-            # Model name files: gwf-nam -> gwf.toml, parent = "sim"
-            model_type = dfn_name[:-4]  # Remove "-nam"
-            filename = f"{model_type}.toml"
-            dfn = dfn.copy()
-            dfn["name"] = model_type
-            dfn["parent"] = "sim"
-        elif dfn_name.startswith("exg-"):
-            # Exchanges: parent = "sim"
-            filename = f"{dfn_name}.toml"
-            dfn = dfn.copy()
-            dfn["parent"] = "sim"
-        elif dfn_name.startswith("sln-"):
-            # Solutions: parent = "sim"
-            filename = f"{dfn_name}.toml"
-            dfn = dfn.copy()
-            dfn["parent"] = "sim"
-        elif dfn_name.startswith("utl-"):
-            # Utilities: parent = "sim"
-            filename = f"{dfn_name}.toml"
-            dfn = dfn.copy()
-            dfn["parent"] = "sim"
-        elif "-" in dfn_name:
-            # Packages: gwf-dis -> parent = "gwf"
-            model_type = dfn_name.split("-")[0]
-            filename = f"{dfn_name}.toml"
-            dfn = dfn.copy()
-            dfn["parent"] = model_type
-        else:
-            # Default case
-            filename = f"{dfn_name}.toml"
-
-        with Path.open(outdir / filename, "wb") as f:
-
-            def drop_none_or_empty(path, key, value):
-                if value is None or value == "" or value == [] or value == {}:
-                    return False
-                return True
-
-            tomli.dump(remap(dfn, visit=drop_none_or_empty), f)
+
+    def to_toml(value):
+        # TOML has no null and the writer only accepts basic types, so
+        # drop unset or empty values and write anything else, such as
+        # the schema version, as text
+        if isinstance(value, dict):
+            converted = {k: to_toml(v) for k, v in value.items()}
+            return {
+                k: v for k, v in converted.items() if v not in (None, "", [], {})
+            }
+        if isinstance(value, (list, tuple)):
+            return [to_toml(v) for v in value if v is not None]
+        if value is None or isinstance(value, (bool, int, float, str)):
+            return value
+        return str(value)
+
+    dfns_in = load_all(indir)
+    dfns = {
+        name: map(dfn, schema_version=schema_version) for name, dfn in dfns_in.items()
+    }
+    for dfn_name, dfn in dfns.items():
+        with (outdir / f"{dfn_name}.toml").open("wb") as f:
+            tomli.dump(to_toml(asdict(dfn)), f)
 
 
 if __name__ == "__main__":
-    """Convert DFN files to TOML."""
+    """
+    Convert DFN files in the original format and schema version (1)
+    to TOML files with a new schema version.
+    """
 
     parser = argparse.ArgumentParser(description="Convert DFN files to TOML.")
     parser.add_argument(
@@ -82,5 +43,12 @@ def drop_none_or_empty(path, key, value):
         "-o",
         help="Output directory.",
     )
+    parser.add_argument(
+        "--schema-version",
+        "-s",
+        type=str,
+        default="2",
+        help="Schema version to convert to.",
+    )
     args = parser.parse_args()
-    convert(args.indir, args.outdir)
+    convert(args.indir, args.outdir, args.schema_version)

From 5dd9e34546a010dc0cab329f8e0702ce956a42aa Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Wed, 8 Oct 2025 18:49:06 -0400
Subject: [PATCH 02/13] appease mypy

---
 modflow_devtools/dfn/__init__.py     | 107 +++++++++++++++------------
 modflow_devtools/dfn/parse.py        |   2 +-
 modflow_devtools/dfn/schema/field.py |   4 +-
 modflow_devtools/dfn/schema/v2.py    |   2 +-
 4 files changed, 62 insertions(+), 53 deletions(-)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 51bf5b2c..18fb5edb 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -9,6 +9,7 @@
 from pathlib import Path
 from typing import (
     Literal,
+    cast,
 )
 
 import tomli
@@ -16,7 +17,6 @@
 from boltons.iterutils import remap
 from packaging.version import Version
 
-import modflow_devtools.dfn.schema.v1 as v1_schema
 from modflow_devtools.dfn.parse import (
     is_advanced_package,
     is_multi_package,
@@ -31,6 +31,24 @@
 from modflow_devtools.dfn.schema.v2 import FieldV2
 from modflow_devtools.misc import try_literal_eval
 
+__all__ = [
+    "SCALAR_TYPES",
+    "Block",
+    "Blocks",
+    "Dfn",
+    "Dfns",
+    "Field",
+    "FieldV1",
+    "Fields",
+    "Ref",
+    "infer_tree",
+    "load",
+    "load_all",
+    "load_tree",
+    "map",
+]
+
+
 Format = Literal["dfn", "toml"]
 """DFN serialization format."""
 
@@ -56,15 +74,18 @@ class Dfn:
     @property
     def fields(self) -> Fields:
         """
-        Top-level fields in all blocks as a single dictionary.
+        A combined map of fields from all blocks.
 
-        Only top-level fields are included, i.e. subfields of records
-        or recarrays are not included.
+        Only top-level fields are included, no subfields of composites
+        such as records or recarrays.
         """
         fields = []
         for block in (self.blocks or {}).values():
             for field in block.values():
                 fields.append((field.name, field))
+
+        # for now return a multidict to support duplicate field names.
+        # TODO: change to normal dict after deprecating v1 schema
         return OMD(fields)
 
 
@@ -125,23 +146,23 @@ def map_field(dfn: Dfn, field: Field) -> Field:
         for a separate context will be given a reference to it.
         """
 
-        fields = dfn.fields
+        fields = cast(OMD, dfn.fields)
 
         def _map_field(_field) -> Field:
-            _field = asdict(_field)
+            field_dict = asdict(_field)
             # parse booleans from strings. everything else can
             # stay a string except default values, which we'll
             # try to parse as arbitrary literals below, and at
             # some point types, once we introduce type hinting
-            _field = {k: try_parse_bool(v) for k, v in _field.items()}
-            _name = _field.pop("name")
-            _type = _field.pop("type", None)
-            shape = _field.pop("shape", None)
+            field_dict = {k: try_parse_bool(v) for k, v in field_dict.items()}
+            _name = field_dict.pop("name")
+            _type = field_dict.pop("type", None)
+            shape = field_dict.pop("shape", None)
             shape = None if shape == "" else shape
-            block = _field.pop("block", None)
-            default = _field.pop("default", None)
+            block = field_dict.pop("block", None)
+            default = field_dict.pop("default", None)
             default = try_literal_eval(default) if _type != "string" else default
-            description = _field.pop("description", "")
+            description = field_dict.pop("description", "")
 
             def _row_field() -> Field:
                 """Parse a table's record (row) field"""
@@ -165,7 +186,7 @@ def _row_field() -> Field:
                     )
 
                 # implicit record with all scalar fields
-                if all(t in v1_schema._SCALAR_TYPES for t in item_types):
+                if all(t in SCALAR_TYPES for t in item_types):
                     return FieldV2.from_dict(
                         {
                             "name": _name,
@@ -175,7 +196,7 @@ def _row_field() -> Field:
                             "description": description.replace(
                                 "is the list of", "is the record of"
                             ),
-                            **_field,
+                            **field_dict,
                         }
                     )
 
@@ -186,6 +207,8 @@ def _row_field() -> Field:
                     if f.name in item_names and f.in_record
                 }
                 first = next(iter(children.values()))
+                if not first.type:
+                    raise ValueError(f"Missing type for field: {first.name}")
                 single = len(children) == 1
                 item_type = (
                     "keystring" if single and "keystring" in first.type else "record"
@@ -199,7 +222,7 @@ def _row_field() -> Field:
                         "description": description.replace(
                             "is the list of", f"is the {item_type} of"
                         ),
-                        **_field,
+                        **field_dict,
                     }
                 )
 
@@ -215,13 +238,13 @@ def _union_fields() -> Fields:
             def _record_fields() -> Fields:
                 """Parse a record's fields"""
                 names = _type.split()[1:]
-                children = {}
+                children: dict[str, Field] = {}
                 for name in names:
                     child = children.get(name, None)
                     if (
                         not child
-                        or not child.in_record
-                        or child.type.startswith("record")
+                        or not child.in_record  # type: ignore
+                        or child.type.startswith("record")  # type: ignore
                     ):
                         continue
                     children[name] = _map_field(child)
@@ -254,7 +277,7 @@ def _record_fields() -> Fields:
             # for now, we can tell a var is an array if its type
             # is scalar and it has a shape. once we have proper
             # typing, this can be read off the type itself.
-            elif shape is not None and _type not in v1_schema._SCALAR_TYPES:
+            elif shape is not None and _type not in SCALAR_TYPES:
                 raise TypeError(f"Unsupported array type: {_type}")
 
             else:
@@ -268,14 +291,15 @@ def _record_fields() -> Fields:
     def map_blocks(dfn: Dfn) -> Blocks:
         fields = {
             field.name: MapV1To2.map_field(dfn, field)
-            for field in dfn.fields.values(multi=True)
-            if not field.in_record
+            for field in cast(OMD, dfn.fields).values(multi=True)
+            if not field.in_record  # type: ignore
         }
-        blocks = {
+        block_dicts = {
             block_name: {f.name: f for f in block}
             for block_name, block in groupby(fields.values(), lambda f: f.block)
         }
-        if (period_block := blocks.get("period", None)) is not None:
+        blocks = {}
+        if (period_block := block_dicts.get("period", None)) is not None:
             blocks["period"] = MapV1To2.map_period_block(dfn, period_block)
 
         def remove_attrs(path, key, value):
@@ -287,7 +311,7 @@ def remove_attrs(path, key, value):
         return remap(blocks, visit=remove_attrs)
 
     def map(self, dfn: Dfn) -> Dfn:
-        if dfn.schema_version == Version("2"):
+        if dfn.schema_version == (v2 := Version("2")):
             return dfn
         return Dfn(
             name=dfn.name,
@@ -295,6 +319,7 @@ def map(self, dfn: Dfn) -> Dfn:
             multi=dfn.multi,
             ref=dfn.ref,
             blocks=MapV1To2.map_blocks(dfn),
+            schema_version=v2,
         )
 
 
@@ -305,10 +330,11 @@ def map(
     """Map a MODFLOW 6 specification to another schema version."""
     if dfn.schema_version == schema_version:
         return dfn
-    elif Version(schema_version) == Version("1"):
+    elif Version(str(schema_version)) == Version("1"):
         raise NotImplementedError("Mapping to schema version 1 is not implemented yet.")
-    elif Version(schema_version) == Version("2"):
+    elif Version(str(schema_version)) == Version("2"):
         return MapV1To2().map(dfn)
+    raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
 
 
 def load(f: str | PathLike, **kwargs) -> Dfn:
@@ -326,7 +352,7 @@ def load(f: str | PathLike, **kwargs) -> Dfn:
                 )
             }
         )
-        dfn = Dfn(
+        return Dfn(
             name=path.stem,
             schema_version=Version("1"),
             parent=try_parse_parent(meta),
@@ -336,8 +362,8 @@ def load(f: str | PathLike, **kwargs) -> Dfn:
         )
     elif path.suffix == ".toml":
         with path.open("rb") as file:
-            dfn = Dfn(**tomli.load(file))
-    return dfn
+            return Dfn(**tomli.load(file))
+    raise ValueError(f"Unsupported file type: {path.suffix}. Expected .dfn or .toml.")
 
 
 def _load_common(path: str | PathLike) -> Fields:
@@ -359,6 +385,7 @@ def load_all(dfndir: str | PathLike) -> Dfns:
         return {path.stem: load(path, common=common) for path in dfns.values()}
     if tomls:
         return {path.stem: load(path) for path in tomls.values()}
+    return {}  # TODO: raise instead?
 
 
 def infer_tree(dfns: Dfns) -> Dfn:
@@ -426,6 +453,7 @@ def get_children(node_name: str) -> Dfns:
             name=(root_name := roots[0][0]),
             blocks=dfns[root_name].blocks,
             children=get_children(root_name),
+            schema_version=schema_version,
         )
     raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
 
@@ -438,22 +466,3 @@ def load_tree(dfndir: str | PathLike) -> Dfn:
     child (and grandchild) components for the relevant models and packages.
     """
     return infer_tree(load_all(dfndir))
-
-
-__all__ = [
-    "SCALAR_TYPES",
-    "Block",
-    "Blocks",
-    "Dfn",
-    "Dfns",
-    "Field",
-    "FieldV1",
-    "FieldV2",
-    "Fields",
-    "Ref",
-    "infer_tree",
-    "load",
-    "load_all",
-    "load_tree",
-    "map",
-]
diff --git a/modflow_devtools/dfn/parse.py b/modflow_devtools/dfn/parse.py
index 589bdb29..9418c461 100644
--- a/modflow_devtools/dfn/parse.py
+++ b/modflow_devtools/dfn/parse.py
@@ -172,7 +172,7 @@ def parse_dfn(
                 else:
                     descr = cmmn["description"]
                     if any(subs):
-                        descr = descr.replace("\\", "").replace("{#1}", subs["{#1}"])
+                        descr = descr.replace("\\", "").replace("{#1}", subs["{#1}"])  # type: ignore
             field["description"] = descr
 
     # Save the last field if needed.
diff --git a/modflow_devtools/dfn/schema/field.py b/modflow_devtools/dfn/schema/field.py
index f5ae8702..d48bde68 100644
--- a/modflow_devtools/dfn/schema/field.py
+++ b/modflow_devtools/dfn/schema/field.py
@@ -27,8 +27,8 @@
 
 @dataclass(kw_only=True)
 class Field:
-    name: str | None = None
-    type: FieldType | None = None
+    name: str
+    type: str | None = None
     block: str | None = None
     default: Any | None = None
     description: str | None = None
diff --git a/modflow_devtools/dfn/schema/v2.py b/modflow_devtools/dfn/schema/v2.py
index f198a748..606a5aef 100644
--- a/modflow_devtools/dfn/schema/v2.py
+++ b/modflow_devtools/dfn/schema/v2.py
@@ -10,7 +10,7 @@
 
 @dataclass(kw_only=True)
 class FieldV2(Field):
-    type: FieldType
+    pass
 
     @classmethod
     def from_dict(cls, d: dict) -> "FieldV2":

From 5c268b6ad9c70f724dda07e1a4eef535ac785c47 Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Wed, 8 Oct 2025 20:21:33 -0400
Subject: [PATCH 03/13] start rewriting tests

---
 autotest/test_dfn.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index a1810968..a59a740e 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -2,7 +2,7 @@
 
 import pytest
 
-from modflow_devtools.dfn import Dfn
+from modflow_devtools.dfn import Dfn, load
 from modflow_devtools.dfn.fetch import fetch_dfns
 from modflow_devtools.dfn2toml import convert
 from modflow_devtools.markers import requires_pkg
@@ -45,8 +45,8 @@ def test_load_v1(dfn_name):
         (DFN_DIR / "common.dfn").open() as common_file,
         (DFN_DIR / f"{dfn_name}.dfn").open() as dfn_file,
     ):
-        common, _ = Dfn._load_v1_flat(common_file)
-        dfn = Dfn.load(dfn_file, name=dfn_name, common=common)
+        common, _ = load(common_file)
+        dfn = load(dfn_file, name=dfn_name, common=common)
         assert any(dfn)
 
 

From 79e78ad7f64e9e52bbc0130c911e31b6ee08e4b0 Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 06:12:04 -0400
Subject: [PATCH 04/13] refactor(dfn): load from file objects; share drop_none_or_empty

---
 autotest/test_dfn.py              | 83 +++++++++++++++----------------
 modflow_devtools/dfn/__init__.py  | 67 ++++++++++++-------------
 modflow_devtools/dfn/parse.py     | 13 ++---
 modflow_devtools/dfn/schema/v1.py |  3 +-
 modflow_devtools/dfn/schema/v2.py |  3 +-
 modflow_devtools/dfn2toml.py      |  8 ++-
 modflow_devtools/misc.py          | 10 ++++
 modflow_devtools/models.py        | 10 +---
 8 files changed, 100 insertions(+), 97 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index a59a740e..50434e5c 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -2,7 +2,7 @@
 
 import pytest
 
-from modflow_devtools.dfn import Dfn, load
+from modflow_devtools.dfn import _load_common, load, load_all, load_tree
 from modflow_devtools.dfn.fetch import fetch_dfns
 from modflow_devtools.dfn2toml import convert
 from modflow_devtools.markers import requires_pkg
@@ -10,7 +10,7 @@
 PROJ_ROOT = Path(__file__).parents[1]
 DFN_DIR = PROJ_ROOT / "autotest" / "temp" / "dfn"
 TOML_DIR = DFN_DIR / "toml"
-VERSIONS = {1: DFN_DIR, 2: TOML_DIR}
+SPEC_DIRS = {1: DFN_DIR, 2: TOML_DIR}
 MF6_OWNER = "MODFLOW-ORG"
 MF6_REPO = "modflow6"
 MF6_REF = "develop"
@@ -30,12 +30,13 @@ def pytest_generate_tests(metafunc):
     if "toml_name" in metafunc.fixturenames:
         convert(DFN_DIR, TOML_DIR)
         dfn_paths = list(DFN_DIR.glob("*.dfn"))
-        assert all(
-            (TOML_DIR / f"{dfn.stem.replace('-nam', '')}.toml").is_file()
+        expected_toml_paths = [
+            TOML_DIR / f"{dfn.stem.replace('-nam', '')}.toml"
             for dfn in dfn_paths
             if "common" not in dfn.stem
-        )
+        ]
         toml_names = [toml.stem for toml in TOML_DIR.glob("*.toml")]
+        assert all(toml_path.exists() for toml_path in expected_toml_paths)
         metafunc.parametrize("toml_name", toml_names, ids=toml_names)
 
 
@@ -45,23 +46,24 @@ def test_load_v1(dfn_name):
         (DFN_DIR / "common.dfn").open() as common_file,
         (DFN_DIR / f"{dfn_name}.dfn").open() as dfn_file,
     ):
-        common, _ = load(common_file)
+        common, _ = _load_common(common_file)
         dfn = load(dfn_file, name=dfn_name, common=common)
-        assert any(dfn)
+        assert any(dfn.fields)
 
 
 @requires_pkg("boltons")
 def test_load_v2(toml_name):
     with (TOML_DIR / f"{toml_name}.toml").open(mode="rb") as toml_file:
-        toml = Dfn.load(toml_file, name=toml_name, version=2)
-        assert any(toml)
+        dfn = load(toml_file, name=toml_name, format="toml")
+        assert any(dfn.fields)
 
 
 @requires_pkg("boltons")
-@pytest.mark.parametrize("version", list(VERSIONS.keys()))
-def test_load_all(version):
-    dfns = Dfn.load_all(VERSIONS[version], version=version)
-    assert any(dfns)
+@pytest.mark.parametrize("schema_version", list(SPEC_DIRS.keys()))
+def test_load_all(schema_version):
+    path = SPEC_DIRS[schema_version]
+    dfns = load_all(path)
+    assert all(any(dfn.fields) for dfn in dfns.values())
 
 
 @requires_pkg("boltons")
@@ -90,37 +92,34 @@ def test_load_tree():
         assert gwf_data["name"] == "gwf"
         assert gwf_data["parent"] == "sim"
 
-        # Test hierarchy enforcement and completeness
-        dfns = Dfn.load_all(tmp_path, version=2)
-        roots = [name for name, dfn in dfns.items() if not dfn.get("parent")]
-        assert len(roots) == 1
-        assert roots[0] == "sim"
-
+        dfns = load_all(tmp_path)
+        root = load_tree(tmp_path)
+        roots = []
         for dfn in dfns.values():
-            parent = dfn.get("parent")
-            if parent:
-                assert parent in dfns
-
-        # Test tree building and navigation
-        tree = Dfn.load_tree(tmp_path, version=2)
-        assert "sim" in tree
-        assert tree["sim"]["name"] == "sim"
-
-        for model_type in ["gwf", "gwt", "gwe"]:
-            if model_type in tree["sim"]:
-                assert tree["sim"][model_type]["name"] == model_type
-                assert tree["sim"][model_type]["parent"] == "sim"
-
-        if "gwf" in tree["sim"]:
+            if dfn.parent:
+                assert dfn.parent in dfns
+            else:
+                roots.append(dfn.name)
+        assert len(roots) == 1
+        assert root.name == "sim"
+        assert root == roots[0]
+
+        model_types = ["gwf", "gwt", "gwe"]
+        models = root.children or {}
+        for model_type in model_types:
+            if model_type in models:
+                assert models[model_type].name == model_type
+                assert models[model_type].parent == "sim"
+
+        if "gwf" in models:
+            pkgs = models["gwf"].children or {}
             gwf_packages = [
-                k
-                for k in tree["sim"]["gwf"].keys()
-                if k.startswith("gwf-") and isinstance(tree["sim"]["gwf"][k], dict)
+                k for k in pkgs if k.startswith("gwf-") and isinstance(pkgs[k], dict)
             ]
             assert len(gwf_packages) > 0
 
-            if "gwf-dis" in tree["sim"]["gwf"]:
-                dis = tree["sim"]["gwf"]["gwf-dis"]
-                assert dis["name"] == "gwf-dis"
-                assert dis["parent"] == "gwf"
-                assert "options" in dis or "dimensions" in dis
+            if dis := pkgs.get("gwf-dis", None):
+                assert dis.name == "gwf-dis"
+                assert dis.parent == "gwf"
+                assert "options" in (dis.blocks or {})
+                assert "dimensions" in (dis.blocks or {})
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 18fb5edb..5ef6d73d 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -257,7 +257,7 @@ def _record_fields() -> Fields:
                     "block": block,
                     "description": description,
                     "default": default,
-                    **_field,
+                    **field_dict,
                 }
             )
 
@@ -337,55 +337,52 @@ def map(
     raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
 
 
-def load(f: str | PathLike, **kwargs) -> Dfn:
+def load(f, name: str, format: str = "dfn", **kwargs) -> Dfn:
     """Load a MODFLOW 6 definition file."""
-    path = Path(f).expanduser().resolve()
-    if path.suffix == ".dfn":
-        fields, meta = parse_dfn(path, **kwargs)
-        blocks = (
-            {}
-            if "common" in path.stem
-            else {
-                block_name: {field["name"]: FieldV1.from_dict(field) for field in block}
-                for block_name, block in groupby(
-                    fields.values(), lambda field: field["block"]
-                )
-            }
-        )
+    if format == "dfn":
+        fields, meta = parse_dfn(f, **kwargs)
+        blocks = {
+            block_name: {field["name"]: FieldV1.from_dict(field) for field in block}
+            for block_name, block in groupby(
+                fields.values(), lambda field: field["block"]
+            )
+        }
         return Dfn(
-            name=path.stem,
+            name=name,
             schema_version=Version("1"),
             parent=try_parse_parent(meta),
             advanced=is_advanced_package(meta),
             multi=is_multi_package(meta),
             blocks=blocks,
         )
-    elif path.suffix == ".toml":
-        with path.open("rb") as file:
-            return Dfn(**tomli.load(file))
-    raise ValueError(f"Unsupported file type: {path.suffix}. Expected .dfn or .toml.")
+    elif format == "toml":
+        return Dfn(name=name, **tomli.load(f))
+    raise ValueError(f"Unsupported format: {format}. Expected 'dfn' or 'toml'.")
 
 
-def _load_common(path: str | PathLike) -> Fields:
-    common_path = Path(path).expanduser().resolve()
-    if not common_path.is_file():
-        return {}
-    common, _ = parse_dfn(common_path)
+def _load_common(f) -> Fields:
+    common, _ = parse_dfn(f)
     return common
 
 
-def load_all(dfndir: str | PathLike) -> Dfns:
+def load_all(path: str | PathLike) -> Dfns:
     """Load a MODFLOW 6 specification from definition files in a directory."""
     exclude = ["common", "flopy"]
-    dfndir = Path(dfndir).expanduser().resolve()
-    dfns = {p.stem: p for p in dfndir.glob("*.dfn") if p.stem not in exclude}
-    tomls = {p.stem: p for p in dfndir.glob("*.toml") if p.stem not in exclude}
-    if dfns:
-        common = _load_common(dfndir / "common.dfn")
-        return {path.stem: load(path, common=common) for path in dfns.values()}
-    if tomls:
-        return {path.stem: load(path) for path in tomls.values()}
-    return {}  # TODO: raise instead?
+    path = Path(path).expanduser().resolve()
+    dfn_paths = {p.stem: p for p in path.glob("*.dfn") if p.stem not in exclude}
+    toml_paths = {p.stem: p for p in path.glob("*.toml") if p.stem not in exclude}
+    dfns = {}
+    if dfn_paths:
+        with (path / "common.dfn").open() as f:
+            common = _load_common(f)
+        for dfn_name, dfn_path in dfn_paths.items():
+            with dfn_path.open() as f:
+                dfns[dfn_name] = load(f, name=dfn_name, common=common, format="dfn")
+    if toml_paths:
+        for toml_name, toml_path in toml_paths.items():
+            with toml_path.open() as f:
+                dfns[toml_name] = load(f, name=toml_name, format="toml")
+    return dfns
 
 
 def infer_tree(dfns: Dfns) -> Dfn:
diff --git a/modflow_devtools/dfn/parse.py b/modflow_devtools/dfn/parse.py
index 9418c461..5716d9cf 100644
--- a/modflow_devtools/dfn/parse.py
+++ b/modflow_devtools/dfn/parse.py
@@ -1,6 +1,4 @@
 from ast import literal_eval
-from os import PathLike
-from pathlib import Path
 from typing import Any
 from warnings import warn
 
@@ -83,17 +81,14 @@ def is_multi_package(meta: list[str]) -> bool:
     return any("multi-package" in m for m in meta)
 
 
-def parse_dfn(
-    path: str | PathLike,
-    common: dict | None = None,
-) -> tuple[OMD, list[str]]:
+def parse_dfn(f, common: dict | None = None) -> tuple[OMD, list[str]]:
     """
     Parse a DFN file into an ordered dict of fields and a list of metadata.
 
     Parameters
     ----------
-    path : str | PathLike
-        Path to the DFN file to parse.
+    f : readable file-like
+        A file-like object to read the DFN file from.
     common : dict, optional
         A dictionary of common variable definitions to use for
         description substitutions, by default None.
@@ -123,7 +118,7 @@ def parse_dfn(
     fields: list = []
     metadata: list = []
 
-    for line in Path(path).expanduser().resolve().open():
+    for line in f:
         # parse metadata line
         if (line := line.strip()).startswith("#"):
             _, sep, tail = line.partition("flopy")
diff --git a/modflow_devtools/dfn/schema/v1.py b/modflow_devtools/dfn/schema/v1.py
index 2d128594..5919881e 100644
--- a/modflow_devtools/dfn/schema/v1.py
+++ b/modflow_devtools/dfn/schema/v1.py
@@ -19,4 +19,5 @@ class FieldV1(Field):
     @classmethod
     def from_dict(cls, d: dict) -> "FieldV1":
         """Create a FieldV1 instance from a dictionary."""
-        return cls(**{k: v for k, v in d.items() if k in cls.__annotations__.keys()})
+        keys = list(cls.__annotations__.keys()) + list(Field.__annotations__.keys())
+        return cls(**{k: v for k, v in d.items() if k in keys})
diff --git a/modflow_devtools/dfn/schema/v2.py b/modflow_devtools/dfn/schema/v2.py
index 606a5aef..e13846cb 100644
--- a/modflow_devtools/dfn/schema/v2.py
+++ b/modflow_devtools/dfn/schema/v2.py
@@ -15,4 +15,5 @@ class FieldV2(Field):
     @classmethod
     def from_dict(cls, d: dict) -> "FieldV2":
         """Create a FieldV2 instance from a dictionary."""
-        return cls(**{k: v for k, v in d.items() if k in cls.__annotations__.keys()})
+        keys = list(cls.__annotations__.keys()) + list(Field.__annotations__.keys())
+        return cls(**{k: v for k, v in d.items() if k in keys})
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index aebb0189..0b16c1b3 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -6,8 +6,10 @@
 from pathlib import Path
 
 import tomli_w as tomli
+from boltons.iterutils import remap
 
 from modflow_devtools.dfn import load_all, map
+from modflow_devtools.misc import drop_none_or_empty
 
 # mypy: ignore-errors
 
@@ -22,7 +24,11 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
     }
     for dfn_name, dfn in dfns.items():
         with Path.open(outdir / f"{dfn_name}.toml", "wb") as f:
-            tomli.dump(asdict(dfn), f)
+            dfn_dict = asdict(dfn)
+            # TODO if we start using c/attrs, swap
+            # this for a custom unstructuring hook
+            dfn_dict["schema_version"] = str(dfn_dict["schema_version"])
+            tomli.dump(remap(dfn_dict, visit=drop_none_or_empty), f)
 
 
 if __name__ == "__main__":
diff --git a/modflow_devtools/misc.py b/modflow_devtools/misc.py
index 65bf614b..5f36c46b 100644
--- a/modflow_devtools/misc.py
+++ b/modflow_devtools/misc.py
@@ -581,3 +581,13 @@ def try_literal_eval(value: str) -> Any:
         return literal_eval(value)
     except (SyntaxError, ValueError):
         return value
+
+
+def drop_none_or_empty(path, key, value):
+    """
+    Drop dictionary items with None or empty string values.
+    For use with `boltons.iterutils.remap`.
+    """
+    if value is None or value == "":
+        return False
+    return True
diff --git a/modflow_devtools/models.py b/modflow_devtools/models.py
index c2fc9b6e..1cafc9d7 100644
--- a/modflow_devtools/models.py
+++ b/modflow_devtools/models.py
@@ -21,13 +21,7 @@
 from pooch import Pooch
 
 import modflow_devtools
-from modflow_devtools.misc import get_model_paths
-
-
-def _drop_none_or_empty(path, key, value):
-    if value is None or value == "":
-        return False
-    return True
+from modflow_devtools.misc import drop_none_or_empty, get_model_paths
 
 
 def _model_sort_key(k) -> int:
@@ -421,7 +415,7 @@ def index(
 
         with self._registry_file_path.open("ab+") as registry_file:
             tomli_w.dump(
-                remap(dict(sorted(files.items())), visit=_drop_none_or_empty),
+                remap(dict(sorted(files.items())), visit=drop_none_or_empty),
                 registry_file,
             )
 

From 01837b66e79ec060070d8e83e5bc880a603e55c8 Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 10:36:44 -0400
Subject: [PATCH 05/13] wip

---
 autotest/test_dfn.py             | 117 ++++++++++++++-----------------
 modflow_devtools/dfn/__init__.py | 111 ++++++++++++++++-------------
 modflow_devtools/dfn2toml.py     |   4 +-
 modflow_devtools/misc.py         |   5 +-
 4 files changed, 120 insertions(+), 117 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index 50434e5c..63f7e2de 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -2,7 +2,7 @@
 
 import pytest
 
-from modflow_devtools.dfn import _load_common, load, load_all, load_tree
+from modflow_devtools.dfn import _load_common, load, load_all
 from modflow_devtools.dfn.fetch import fetch_dfns
 from modflow_devtools.dfn2toml import convert
 from modflow_devtools.markers import requires_pkg
@@ -29,14 +29,11 @@ def pytest_generate_tests(metafunc):
 
     if "toml_name" in metafunc.fixturenames:
         convert(DFN_DIR, TOML_DIR)
-        dfn_paths = list(DFN_DIR.glob("*.dfn"))
         expected_toml_paths = [
-            TOML_DIR / f"{dfn.stem.replace('-nam', '')}.toml"
-            for dfn in dfn_paths
-            if "common" not in dfn.stem
+            dfn for dfn in DFN_DIR.glob("*.dfn") if "common" not in dfn.stem
         ]
-        toml_names = [toml.stem for toml in TOML_DIR.glob("*.toml")]
         assert all(toml_path.exists() for toml_path in expected_toml_paths)
+        toml_names = [toml.stem for toml in TOML_DIR.glob("*.toml")]
         metafunc.parametrize("toml_name", toml_names, ids=toml_names)
 
 
@@ -47,7 +44,7 @@ def test_load_v1(dfn_name):
         (DFN_DIR / f"{dfn_name}.dfn").open() as dfn_file,
     ):
         common, _ = _load_common(common_file)
-        dfn = load(dfn_file, name=dfn_name, common=common)
+        dfn = load(dfn_file, name=dfn_name, format="dfn", common=common)
         assert any(dfn.fields)
 
 
@@ -61,65 +58,57 @@ def test_load_v2(toml_name):
 @requires_pkg("boltons")
 @pytest.mark.parametrize("schema_version", list(SPEC_DIRS.keys()))
 def test_load_all(schema_version):
-    path = SPEC_DIRS[schema_version]
-    dfns = load_all(path)
+    dfns = load_all(path=SPEC_DIRS[schema_version])
     assert all(any(dfn.fields) for dfn in dfns.values())
 
 
-@requires_pkg("boltons")
-def test_load_tree():
-    import tempfile
-
+@requires_pkg("boltons", "tomli")
+def test_convert(function_tmpdir):
     import tomli
 
-    with tempfile.TemporaryDirectory() as tmp_dir:
-        tmp_path = Path(tmp_dir)
-        convert(DFN_DIR, tmp_path)
-
-        # Test file conversion and naming
-        assert (tmp_path / "sim.toml").exists()
-        assert (tmp_path / "gwf.toml").exists()
-        assert not (tmp_path / "sim-nam.toml").exists()
-
-        # Test parent relationships in files
-        with (tmp_path / "sim.toml").open("rb") as f:
-            sim_data = tomli.load(f)
-        assert sim_data["name"] == "sim"
-        assert "parent" not in sim_data
-
-        with (tmp_path / "gwf.toml").open("rb") as f:
-            gwf_data = tomli.load(f)
-        assert gwf_data["name"] == "gwf"
-        assert gwf_data["parent"] == "sim"
-
-        dfns = load_all(tmp_path)
-        root = load_tree(tmp_path)
-        roots = []
-        for dfn in dfns.values():
-            if dfn.parent:
-                assert dfn.parent in dfns
-            else:
-                roots.append(dfn.name)
-        assert len(roots) == 1
-        assert root.name == "sim"
-        assert root == roots[0]
-
-        model_types = ["gwf", "gwt", "gwe"]
-        models = root.children or {}
-        for model_type in model_types:
-            if model_type in models:
-                assert models[model_type].name == model_type
-                assert models[model_type].parent == "sim"
-
-        if "gwf" in models:
-            pkgs = models["gwf"].children or {}
-            gwf_packages = [
-                k for k in pkgs if k.startswith("gwf-") and isinstance(pkgs[k], dict)
-            ]
-            assert len(gwf_packages) > 0
-
-            if dis := pkgs.get("gwf-dis", None):
-                assert dis.name == "gwf-dis"
-                assert dis.parent == "gwf"
-                assert "options" in (dis.blocks or {})
-                assert "dimensions" in (dis.blocks or {})
+    convert(DFN_DIR, function_tmpdir)
+
+    assert (function_tmpdir / "sim-nam.toml").exists()
+    assert (function_tmpdir / "gwf-nam.toml").exists()
+
+    with (function_tmpdir / "sim-nam.toml").open("rb") as f:
+        sim_data = tomli.load(f)
+    assert sim_data["name"] == "sim-nam"
+    assert sim_data["schema_version"] == "2"
+    assert "parent" not in sim_data
+
+    with (function_tmpdir / "gwf-nam.toml").open("rb") as f:
+        gwf_data = tomli.load(f)
+    assert gwf_data["name"] == "gwf-nam"
+    assert gwf_data["parent"] == "sim-nam"
+    assert gwf_data["schema_version"] == "2"
+
+    dfns = load_all(function_tmpdir)
+    roots = []
+    for dfn in dfns.values():
+        if dfn.parent:
+            assert dfn.parent in dfns
+        else:
+            roots.append(dfn.name)
+    assert len(roots) == 1
+    root = dfns[roots[0]]
+    assert root.name == "sim-nam"
+
+    models = root.children or {}
+    for mdl in models:
+        assert models[mdl].name == mdl
+        assert models[mdl].parent == "sim-nam"
+
+    if gwf := models.get("gwf-nam", None):
+        pkgs = gwf.children or {}
+        pkgs = {
+            k: v
+            for k, v in pkgs.items()
+            if k.startswith("gwf-") and isinstance(v, dict)
+        }
+        assert len(pkgs) > 0
+        if dis := pkgs.get("gwf-dis", None):
+            assert dis.name == "gwf-dis"
+            assert dis.parent == "gwf"
+            assert "options" in (dis.blocks or {})
+            assert "dimensions" in (dis.blocks or {})
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 5ef6d73d..0888b391 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -29,7 +29,7 @@
 from modflow_devtools.dfn.schema.ref import Ref
 from modflow_devtools.dfn.schema.v1 import FieldV1
 from modflow_devtools.dfn.schema.v2 import FieldV2
-from modflow_devtools.misc import try_literal_eval
+from modflow_devtools.misc import drop_none_or_empty, try_literal_eval
 
 __all__ = [
     "SCALAR_TYPES",
@@ -41,6 +41,7 @@
     "FieldV1",
     "Fields",
     "Ref",
+    "flatten",
     "infer_tree",
     "load",
     "load_all",
@@ -62,8 +63,8 @@ class Dfn:
     MODFLOW 6 input component definition.
     """
 
-    name: str
     schema_version: Version
+    name: str
     parent: str | None = None
     advanced: bool = False
     multi: bool = False
@@ -313,6 +314,7 @@ def remove_attrs(path, key, value):
     def map(self, dfn: Dfn) -> Dfn:
         if dfn.schema_version == (v2 := Version("2")):
             return dfn
+
         return Dfn(
             name=dfn.name,
             advanced=dfn.advanced,
@@ -320,6 +322,7 @@ def map(self, dfn: Dfn) -> Dfn:
             ref=dfn.ref,
             blocks=MapV1To2.map_blocks(dfn),
             schema_version=v2,
+            parent=dfn.parent,
         )
 
 
@@ -396,63 +399,73 @@ def infer_tree(dfns: Dfns) -> Dfn:
     Assumes all DFNs are of the same schema version.
     """
 
-    def drop_none_or_empty(path, key, value):
-        if value is None or value == "" or value == [] or value == {}:
-            return False
-        return True
-
-    def add_parent(dfn):
-        dfn = dfn.copy()
-        dfn_name = dfn["name"]
-        if dfn_name == "sim-nam":
-            # simulation name file
-            dfn.name = "sim"
+    def set_parent(dfn):
+        dfn = asdict(dfn)
+        if (dfn_name := dfn["name"]) == "sim-nam":
+            pass
         elif dfn_name.endswith("-nam"):
-            # model name files
-            model_type = dfn_name[:-4]  # Remove "-nam"
-            dfn.name = model_type
-            dfn.parent = "sim"
+            dfn["parent"] = "sim-nam"
         elif (
             dfn_name.startswith("exg-")
             or dfn_name.startswith("sln-")
             or dfn_name.startswith("utl-")
         ):
-            # exchanges, solutions, standalone utilities
-            dfn.parent = "sim"
+            dfn["parent"] = "sim-nam"
         elif "-" in dfn_name:
-            # packages
-            model_type = dfn_name.split("-")[0]
-            dfn.parent = model_type
-
-        return remap(dfn, visit=drop_none_or_empty)
-
-    dfns = {name: add_parent(dfn) for name, dfn in dfns.items()}
-    first = next(iter(dfns.values()), None)
-    schema_version = first.schema_version if first else Version("1")
-
-    if schema_version == Version("1"):
-        raise NotImplementedError("Structure inference from v1 schema not implemented")
-    elif schema_version == Version("2"):
-        if (
-            len(
-                roots := [
-                    (name, dfn) for name, dfn in dfns.items() if dfn.parent is None
-                ]
+            mdl = dfn_name.split("-")[0]
+            dfn["parent"] = f"{mdl}-nam"
+
+        return Dfn(**remap(dfn, visit=drop_none_or_empty))
+
+    dfns = {name: set_parent(dfn) for name, dfn in dfns.items()}
+    first_dfn = next(iter(dfns.values()), None)
+    match schema_version := str(
+        first_dfn.schema_version if first_dfn else Version("1")
+    ):
+        case "1":
+            raise NotImplementedError("Tree inference from v1 schema not implemented")
+        case "2":
+            if (
+                nroots := len(
+                    roots := [
+                        (name, dfn) for name, dfn in dfns.items() if dfn.parent is None
+                    ]
+                )
+            ) != 1:
+                raise ValueError(f"Expected one root component, found {nroots}")
+
+            def get_children(node_name: str) -> Dfns:
+                return {
+                    name: dfn for name, dfn in dfns.items() if dfn.parent == node_name
+                }
+
+            return Dfn(
+                name=(root_name := roots[0][0]),
+                blocks=dfns[root_name].blocks,
+                children=get_children(root_name),
+                schema_version=Version(schema_version),
+            )
+        case _:
+            raise ValueError(
+                f"Unsupported schema version: {schema_version}. Expected 1 or 2."
             )
-            != 1
-        ):
-            raise ValueError(f"Expected one root component, found {len(roots)}")
 
-        def get_children(node_name: str) -> Dfns:
-            return {name: dfn for name, dfn in dfns.items() if dfn.parent == node_name}
 
-        return Dfn(
-            name=(root_name := roots[0][0]),
-            blocks=dfns[root_name].blocks,
-            children=get_children(root_name),
-            schema_version=schema_version,
-        )
-    raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
+def flatten(dfn: Dfn) -> Dfns:
+    """
+    Flatten a MODFLOW 6 input component hierarchy to a flat spec:
+    unlinked DFNs, i.e. without `children` populated, only `parent`.
+
+    Returns a dictionary of all components in the tree.
+    """
+
+    def _flatten(dfn: Dfn) -> Dfns:
+        dfns = {dfn.name: replace(dfn, children=None)}
+        for child in (dfn.children or {}).values():
+            dfns.update(_flatten(child))
+        return dfns
+
+    return _flatten(dfn)
 
 
 def load_tree(dfndir: str | PathLike) -> Dfn:
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index 0b16c1b3..d1b529c9 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -8,7 +8,7 @@
 import tomli_w as tomli
 from boltons.iterutils import remap
 
-from modflow_devtools.dfn import load_all, map
+from modflow_devtools.dfn import flatten, load_tree, map
 from modflow_devtools.misc import drop_none_or_empty
 
 # mypy: ignore-errors
@@ -18,7 +18,7 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
     indir = Path(indir).expanduser().absolute()
     outdir = Path(outdir).expanduser().absolute()
     outdir.mkdir(exist_ok=True, parents=True)
-    dfns_in = load_all(indir)
+    dfns_in = flatten(load_tree(indir))
     dfns = {
         name: map(dfn, schema_version=schema_version) for name, dfn in dfns_in.items()
     }
diff --git a/modflow_devtools/misc.py b/modflow_devtools/misc.py
index 5f36c46b..38d2e25a 100644
--- a/modflow_devtools/misc.py
+++ b/modflow_devtools/misc.py
@@ -4,6 +4,7 @@
 import traceback
 from _warnings import warn
 from ast import literal_eval
+from collections.abc import Sized
 from contextlib import contextmanager
 from enum import Enum
 from functools import wraps
@@ -585,9 +586,9 @@ def try_literal_eval(value: str) -> Any:
 
 def drop_none_or_empty(path, key, value):
     """
-    Drop dictionary items with None or empty string values.
+    Drop dictionary items whose value is None or has zero length.
     For use with `boltons.iterutils.remap`.
     """
-    if value is None or value == "":
+    if value is None or (isinstance(value, Sized) and len(value) == 0):
         return False
     return True

From b161611c04502c928e5fcf5a4c8fabb917ee5703 Mon Sep 17 00:00:00 2001
From: wpbonelli <wpbonelli@gmail.com>
Date: Thu, 9 Oct 2025 11:17:39 -0400
Subject: [PATCH 06/13] fix(dfn): check name on TOML load, map DFNs before inferring tree

---
 autotest/test_dfn.py             |  2 +-
 modflow_devtools/dfn/__init__.py | 11 ++++++++---
 modflow_devtools/dfn2toml.py     | 16 ++++++++++++----
 3 files changed, 21 insertions(+), 8 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index 63f7e2de..3185fd17 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -43,7 +43,7 @@ def test_load_v1(dfn_name):
         (DFN_DIR / "common.dfn").open() as common_file,
         (DFN_DIR / f"{dfn_name}.dfn").open() as dfn_file,
     ):
-        common, _ = _load_common(common_file)
+        common = _load_common(common_file)
         dfn = load(dfn_file, name=dfn_name, format="dfn", common=common)
         assert any(dfn.fields)
 
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 0888b391..48ebdbd2 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -340,9 +340,10 @@ def map(
     raise ValueError(f"Unsupported schema version: {schema_version}. Expected 1 or 2.")
 
 
-def load(f, name: str, format: str = "dfn", **kwargs) -> Dfn:
+def load(f, format: str = "dfn", **kwargs) -> Dfn:
     """Load a MODFLOW 6 definition file."""
     if format == "dfn":
+        name = kwargs.pop("name")
         fields, meta = parse_dfn(f, **kwargs)
         blocks = {
             block_name: {field["name"]: FieldV1.from_dict(field) for field in block}
@@ -359,7 +360,11 @@ def load(f, name: str, format: str = "dfn", **kwargs) -> Dfn:
             blocks=blocks,
         )
     elif format == "toml":
-        return Dfn(name=name, **tomli.load(f))
+        if (name := kwargs.pop("name", None)) is not None:
+            if name != (data := tomli.load(f)).pop("name", name):
+                raise ValueError(f"DFN name mismatch: {name} != {data.get('name')}")
+            return Dfn(name=name, **data)
+        return Dfn(**data)
     raise ValueError(f"Unsupported format: {format}. Expected 'dfn' or 'toml'.")
 
 
@@ -383,7 +388,7 @@ def load_all(path: str | PathLike) -> Dfns:
                 dfns[dfn_name] = load(f, name=dfn_name, common=common, format="dfn")
     if toml_paths:
         for toml_name, toml_path in toml_paths.items():
-            with toml_path.open() as f:
+            with toml_path.open("rb") as f:
                 dfns[toml_name] = load(f, name=toml_name, format="toml")
     return dfns
 
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index d1b529c9..3248b802 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -8,7 +8,7 @@
 import tomli_w as tomli
 from boltons.iterutils import remap
 
-from modflow_devtools.dfn import flatten, load_tree, map
+from modflow_devtools.dfn import flatten, map
 from modflow_devtools.misc import drop_none_or_empty
 
 # mypy: ignore-errors
@@ -18,10 +18,18 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
     indir = Path(indir).expanduser().absolute()
     outdir = Path(outdir).expanduser().absolute()
     outdir.mkdir(exist_ok=True, parents=True)
-    dfns_in = flatten(load_tree(indir))
-    dfns = {
-        name: map(dfn, schema_version=schema_version) for name, dfn in dfns_in.items()
+
+    # Load all DFNs individually first, then map to target schema
+    from modflow_devtools.dfn import infer_tree, load_all
+
+    dfns_raw = load_all(indir)
+    dfns_mapped = {
+        name: map(dfn, schema_version=schema_version) for name, dfn in dfns_raw.items()
     }
+
+    # Now infer tree structure with mapped DFNs and flatten
+    tree = infer_tree(dfns_mapped)
+    dfns = flatten(tree)
     for dfn_name, dfn in dfns.items():
         with Path.open(outdir / f"{dfn_name}.toml", "wb") as f:
             dfn_dict = asdict(dfn)

From 0aab9c3eb0c4648043645609cf56a8dbd5282b96 Mon Sep 17 00:00:00 2001
From: wpbonelli <wpbonelli@gmail.com>
Date: Thu, 9 Oct 2025 11:42:16 -0400
Subject: [PATCH 07/13] fix(dfn): round-trip blocks via TOML, keep non-period blocks in map

---
 autotest/test_dfn.py             |  8 +++---
 modflow_devtools/dfn/__init__.py | 45 ++++++++++++++++++++++++++++----
 modflow_devtools/dfn2toml.py     | 15 +++++++++--
 3 files changed, 58 insertions(+), 10 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index 3185fd17..d7f11ce3 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -14,6 +14,7 @@
 MF6_OWNER = "MODFLOW-ORG"
 MF6_REPO = "modflow6"
 MF6_REF = "develop"
+EMPTY_DFNS = {"exg-gwfgwe", "exg-gwfgwt", "exg-gwfprt", "sln-ems"}
 
 
 def pytest_generate_tests(metafunc):
@@ -45,21 +46,22 @@ def test_load_v1(dfn_name):
     ):
         common = _load_common(common_file)
         dfn = load(dfn_file, name=dfn_name, format="dfn", common=common)
-        assert any(dfn.fields)
+        assert any(dfn.fields) == (dfn.name not in EMPTY_DFNS)
 
 
 @requires_pkg("boltons")
 def test_load_v2(toml_name):
     with (TOML_DIR / f"{toml_name}.toml").open(mode="rb") as toml_file:
         dfn = load(toml_file, name=toml_name, format="toml")
-        assert any(dfn.fields)
+        assert any(dfn.fields) == (dfn.name not in EMPTY_DFNS)
 
 
 @requires_pkg("boltons")
 @pytest.mark.parametrize("schema_version", list(SPEC_DIRS.keys()))
 def test_load_all(schema_version):
     dfns = load_all(path=SPEC_DIRS[schema_version])
-    assert all(any(dfn.fields) for dfn in dfns.values())
+    for dfn in dfns.values():
+        assert any(dfn.fields) == (dfn.name not in EMPTY_DFNS)
 
 
 @requires_pkg("boltons", "tomli")
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 48ebdbd2..01a1355a 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -300,9 +300,16 @@ def map_blocks(dfn: Dfn) -> Blocks:
             for block_name, block in groupby(fields.values(), lambda f: f.block)
         }
         blocks = {}
+
+        # Handle period blocks specially
         if (period_block := block_dicts.get("period", None)) is not None:
             blocks["period"] = MapV1To2.map_period_block(dfn, period_block)
 
+        # Include all other blocks
+        for block_name, block_data in block_dicts.items():
+            if block_name != "period":  # Skip period since it's handled above
+                blocks[block_name] = block_data
+
         def remove_attrs(path, key, value):
             # remove unneeded variable attributes
             if key in ["in_record", "tagged", "preserve_case"]:
@@ -359,12 +366,40 @@ def load(f, format: str = "dfn", **kwargs) -> Dfn:
             multi=is_multi_package(meta),
             blocks=blocks,
         )
+
     elif format == "toml":
-        if (name := kwargs.pop("name", None)) is not None:
-            if name != (data := tomli.load(f)).pop("name", name):
-                raise ValueError(f"DFN name mismatch: {name} != {data.get('name')}")
-            return Dfn(name=name, **data)
-        return Dfn(**data)
+        data = tomli.load(f)
+        # a name stored in the file wins; the name= kwarg is only a fallback
+        dfn_fields = {
+            "name": data.pop("name", kwargs.get("name", None)),
+            "schema_version": Version(str(data.pop("schema_version", "2"))),
+            "parent": data.pop("parent", None),
+            "advanced": data.pop("advanced", False),
+            "multi": data.pop("multi", False),
+            "ref": data.pop("ref", None),
+        }
+        # get() above leaves name= in kwargs so this consistency check can fire
+        if (expected_name := kwargs.pop("name", None)) is not None:
+            if dfn_fields["name"] != expected_name:
+                raise ValueError(
+                    f"DFN name mismatch: {expected_name} != {dfn_fields['name']}"
+                )
+
+        blocks = {}
+        for section_name, section_data in data.items():
+            if isinstance(section_data, dict):
+                block_fields = {}
+                for field_name, field_data in section_data.items():
+                    if isinstance(field_data, dict):
+                        block_fields[field_name] = FieldV2.from_dict(field_data)
+                    else:
+                        block_fields[field_name] = field_data
+                blocks[section_name] = block_fields
+
+        dfn_fields["blocks"] = blocks if blocks else None
+
+        return Dfn(**dfn_fields)
+
     raise ValueError(f"Unsupported format: {format}. Expected 'dfn' or 'toml'.")
 
 
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index 3248b802..ba26239c 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -32,10 +32,21 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
     dfns = flatten(tree)
     for dfn_name, dfn in dfns.items():
         with Path.open(outdir / f"{dfn_name}.toml", "wb") as f:
+            # TODO if we start using c/attrs, swap out
+            # all this for a custom unstructuring hook
             dfn_dict = asdict(dfn)
-            # TODO if we start using c/attrs, swap
-            # this for a custom unstructuring hook
             dfn_dict["schema_version"] = str(dfn_dict["schema_version"])
+
+            if dfn_dict.get("blocks"):
+                blocks = dfn_dict.pop("blocks")
+                for block_name, block_fields in blocks.items():
+                    # Create nested structure for each block
+                    if block_name not in dfn_dict:
+                        dfn_dict[block_name] = {}
+                    for field_name, field_data in block_fields.items():
+                        field_data.pop("children", None)
+                        dfn_dict[block_name][field_name] = field_data
+
             tomli.dump(remap(dfn_dict, visit=drop_none_or_empty), f)
 
 

From e2ea64f1fc502f2d7cd778e87541367ca66370ff Mon Sep 17 00:00:00 2001
From: wpbonelli <wpbonelli@gmail.com>
Date: Thu, 9 Oct 2025 11:50:47 -0400
Subject: [PATCH 08/13] appease mypy

---
 modflow_devtools/dfn/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 01a1355a..5a1c25f1 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -394,7 +394,7 @@ def load(f, format: str = "dfn", **kwargs) -> Dfn:
                         block_fields[field_name] = FieldV2.from_dict(field_data)
                     else:
                         block_fields[field_name] = field_data
-                blocks[section_name] = block_fields
+                blocks[section_name] = block_fields # type: ignore
 
         dfn_fields["blocks"] = blocks if blocks else None
 

From 67a2bdbf7425d665dcd07e44a20b182cefbaea09 Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 13:27:09 -0400
Subject: [PATCH 09/13] ruff

---
 modflow_devtools/dfn/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 5a1c25f1..d4fa5bd0 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -394,7 +394,7 @@ def load(f, format: str = "dfn", **kwargs) -> Dfn:
                         block_fields[field_name] = FieldV2.from_dict(field_data)
                     else:
                         block_fields[field_name] = field_data
-                blocks[section_name] = block_fields # type: ignore
+                blocks[section_name] = block_fields  # type: ignore
 
         dfn_fields["blocks"] = blocks if blocks else None
 

From c9fcfc616ff917377555eee3e2106aec15409e5d Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 13:34:44 -0400
Subject: [PATCH 10/13] cleanup

---
 autotest/test_dfn.py             |  6 +++---
 modflow_devtools/dfn/__init__.py | 24 +++++++++++++-----------
 modflow_devtools/dfn2toml.py     | 21 +++++++--------------
 3 files changed, 23 insertions(+), 28 deletions(-)

diff --git a/autotest/test_dfn.py b/autotest/test_dfn.py
index d7f11ce3..0611ee08 100644
--- a/autotest/test_dfn.py
+++ b/autotest/test_dfn.py
@@ -2,7 +2,7 @@
 
 import pytest
 
-from modflow_devtools.dfn import _load_common, load, load_all
+from modflow_devtools.dfn import _load_common, load, load_flat
 from modflow_devtools.dfn.fetch import fetch_dfns
 from modflow_devtools.dfn2toml import convert
 from modflow_devtools.markers import requires_pkg
@@ -59,7 +59,7 @@ def test_load_v2(toml_name):
 @requires_pkg("boltons")
 @pytest.mark.parametrize("schema_version", list(SPEC_DIRS.keys()))
 def test_load_all(schema_version):
-    dfns = load_all(path=SPEC_DIRS[schema_version])
+    dfns = load_flat(path=SPEC_DIRS[schema_version])
     for dfn in dfns.values():
         assert any(dfn.fields) == (dfn.name not in EMPTY_DFNS)
 
@@ -85,7 +85,7 @@ def test_convert(function_tmpdir):
     assert gwf_data["parent"] == "sim-nam"
     assert gwf_data["schema_version"] == "2"
 
-    dfns = load_all(function_tmpdir)
+    dfns = load_flat(function_tmpdir)
     roots = []
     for dfn in dfns.values():
         if dfn.parent:
diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index d4fa5bd0..188a27d3 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -41,12 +41,12 @@
     "FieldV1",
     "Fields",
     "Ref",
-    "flatten",
-    "infer_tree",
     "load",
-    "load_all",
+    "load_flat",
     "load_tree",
     "map",
+    "to_flat",
+    "to_tree",
 ]
 
 
@@ -408,7 +408,7 @@ def _load_common(f) -> Fields:
     return common
 
 
-def load_all(path: str | PathLike) -> Dfns:
+def load_flat(path: str | PathLike) -> Dfns:
     """Load a MODFLOW 6 specification from definition files in a directory."""
     exclude = ["common", "flopy"]
     path = Path(path).expanduser().resolve()
@@ -428,15 +428,17 @@ def load_all(path: str | PathLike) -> Dfns:
     return dfns
 
 
-def infer_tree(dfns: Dfns) -> Dfn:
+def to_tree(dfns: Dfns) -> Dfn:
     """
     Infer the MODFLOW 6 input component hierarchy from a flat spec:
     unlinked DFNs, i.e. without `children` populated, only `parent`.
 
-    Returns the root component with children filled.
-    There must be exactly one root, i.e. component with no `parent`.
+    Returns the root component. There must be exactly one root, i.e.
+    component with no `parent`. Composite components have `children`
+    populated.
 
-    Assumes all DFNs are of the same schema version.
+    Assumes DFNs are already in v2 schema, just lacking parent-child
+    links; before calling this function, map them first with `map()`.
     """
 
     def set_parent(dfn):
@@ -491,12 +493,12 @@ def get_children(node_name: str) -> Dfns:
             )
 
 
-def flatten(dfn: Dfn) -> Dfns:
+def to_flat(dfn: Dfn) -> Dfns:
     """
     Flatten a MODFLOW 6 input component hierarchy to a flat spec:
     unlinked DFNs, i.e. without `children` populated, only `parent`.
 
-    Returns a dictionary of all components in the tree.
+    Returns a dictionary of all components in the specification.
     """
 
     def _flatten(dfn: Dfn) -> Dfns:
@@ -515,4 +517,4 @@ def load_tree(dfndir: str | PathLike) -> Dfn:
     A single root component definition (the simulation) is returned. This contains
     child (and grandchild) components for the relevant models and packages.
     """
-    return infer_tree(load_all(dfndir))
+    return to_tree(load_flat(dfndir))
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index ba26239c..450aae6c 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -8,7 +8,7 @@
 import tomli_w as tomli
 from boltons.iterutils import remap
 
-from modflow_devtools.dfn import flatten, map
+from modflow_devtools.dfn import load_flat, map, to_flat, to_tree
 from modflow_devtools.misc import drop_none_or_empty
 
 # mypy: ignore-errors
@@ -19,28 +19,21 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
     outdir = Path(outdir).expanduser().absolute()
     outdir.mkdir(exist_ok=True, parents=True)
 
-    # Load all DFNs individually first, then map to target schema
-    from modflow_devtools.dfn import infer_tree, load_all
-
-    dfns_raw = load_all(indir)
-    dfns_mapped = {
-        name: map(dfn, schema_version=schema_version) for name, dfn in dfns_raw.items()
+    dfns = {
+        name: map(dfn, schema_version=schema_version)
+        for name, dfn in load_flat(indir).items()
     }
-
-    # Now infer tree structure with mapped DFNs and flatten
-    tree = infer_tree(dfns_mapped)
-    dfns = flatten(tree)
-    for dfn_name, dfn in dfns.items():
+    tree = to_tree(dfns)
+    flat = to_flat(tree)
+    for dfn_name, dfn in flat.items():
         with Path.open(outdir / f"{dfn_name}.toml", "wb") as f:
             # TODO if we start using c/attrs, swap out
             # all this for a custom unstructuring hook
             dfn_dict = asdict(dfn)
             dfn_dict["schema_version"] = str(dfn_dict["schema_version"])
-
             if dfn_dict.get("blocks"):
                 blocks = dfn_dict.pop("blocks")
                 for block_name, block_fields in blocks.items():
-                    # Create nested structure for each block
                     if block_name not in dfn_dict:
                         dfn_dict[block_name] = {}
                     for field_name, field_data in block_fields.items():

From ee304efc6f8ef640f46921a9fda1cc971068594e Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 13:49:23 -0400
Subject: [PATCH 11/13] fix(dfn): fill record children, link tree recursively in to_tree

---
 modflow_devtools/dfn/__init__.py | 49 +++++++++++++++-----------------
 modflow_devtools/dfn2toml.py     | 12 ++++++--
 2 files changed, 33 insertions(+), 28 deletions(-)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 188a27d3..58b952dc 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -188,16 +188,17 @@ def _row_field() -> Field:
 
                 # implicit record with all scalar fields
                 if all(t in SCALAR_TYPES for t in item_types):
+                    children = _record_fields()
                     return FieldV2.from_dict(
                         {
+                            **field_dict,
                             "name": _name,
                             "type": "record",
                             "block": block,
-                            "children": _record_fields(),
+                            "children": children,
                             "description": description.replace(
                                 "is the list of", "is the record of"
                             ),
-                            **field_dict,
                         }
                     )
 
@@ -239,17 +240,13 @@ def _union_fields() -> Fields:
             def _record_fields() -> Fields:
                 """Parse a record's fields"""
                 names = _type.split()[1:]
-                children: dict[str, Field] = {}
-                for name in names:
-                    child = children.get(name, None)
-                    if (
-                        not child
-                        or not child.in_record  # type: ignore
-                        or child.type.startswith("record")  # type: ignore
-                    ):
-                        continue
-                    children[name] = _map_field(child)
-                return children
+                return {
+                    f.name: _map_field(f)
+                    for f in fields.values(multi=True)
+                    if f.name in names
+                    and f.in_record
+                    and not f.type.startswith("record")
+                }
 
             _field = FieldV2.from_dict(
                 {
@@ -305,9 +302,8 @@ def map_blocks(dfn: Dfn) -> Blocks:
         if (period_block := block_dicts.get("period", None)) is not None:
             blocks["period"] = MapV1To2.map_period_block(dfn, period_block)
 
-        # Include all other blocks
         for block_name, block_data in block_dicts.items():
-            if block_name != "period":  # Skip period since it's handled above
+            if block_name != "period":
                 blocks[block_name] = block_data
 
         def remove_attrs(path, key, value):
@@ -469,24 +465,25 @@ def set_parent(dfn):
         case "2":
             if (
                 nroots := len(
-                    roots := [
-                        (name, dfn) for name, dfn in dfns.items() if dfn.parent is None
-                    ]
+                    roots := {
+                        name: dfn for name, dfn in dfns.items() if dfn.parent is None
+                    }
                 )
             ) != 1:
                 raise ValueError(f"Expected one root component, found {nroots}")
 
-            def get_children(node_name: str) -> Dfns:
-                return {
+            def _build_tree(node_name: str) -> Dfn:
+                node = dfns[node_name]
+                children = {
                     name: dfn for name, dfn in dfns.items() if dfn.parent == node_name
                 }
+                if any(children):
+                    node.children = {
+                        name: _build_tree(name) for name in children.keys()
+                    }
+                return node
 
-            return Dfn(
-                name=(root_name := roots[0][0]),
-                blocks=dfns[root_name].blocks,
-                children=get_children(root_name),
-                schema_version=Version(schema_version),
-            )
+            return _build_tree(next(iter(roots.keys())))
         case _:
             raise ValueError(
                 f"Unsupported schema version: {schema_version}. Expected 1 or 2."
diff --git a/modflow_devtools/dfn2toml.py b/modflow_devtools/dfn2toml.py
index 450aae6c..db7d5eaf 100644
--- a/modflow_devtools/dfn2toml.py
+++ b/modflow_devtools/dfn2toml.py
@@ -9,6 +9,7 @@
 from boltons.iterutils import remap
 
 from modflow_devtools.dfn import load_flat, map, to_flat, to_tree
+from modflow_devtools.dfn.schema.block import block_sort_key
 from modflow_devtools.misc import drop_none_or_empty
 
 # mypy: ignore-errors
@@ -37,10 +38,17 @@ def convert(indir: PathLike, outdir: PathLike, schema_version: str = "2") -> Non
                     if block_name not in dfn_dict:
                         dfn_dict[block_name] = {}
                     for field_name, field_data in block_fields.items():
-                        field_data.pop("children", None)
                         dfn_dict[block_name][field_name] = field_data
 
-            tomli.dump(remap(dfn_dict, visit=drop_none_or_empty), f)
+            tomli.dump(
+                dict(
+                    sorted(
+                        remap(dfn_dict, visit=drop_none_or_empty).items(),
+                        key=block_sort_key,
+                    )
+                ),
+                f,
+            )
 
 
 if __name__ == "__main__":

From 01c84f765f5517d91a2e28dce42478bbde86441e Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 14:26:05 -0400
Subject: [PATCH 12/13] fix(dfn): export FieldV2 in __all__

---
 modflow_devtools/dfn/__init__.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 58b952dc..6f966dd9 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -39,6 +39,7 @@
     "Dfns",
     "Field",
     "FieldV1",
+    "FieldV2",
     "Fields",
     "Ref",
     "load",

From dbad9ac72229c0ad226530fd844e9b37638153e7 Mon Sep 17 00:00:00 2001
From: w-bonelli <wesbonelli@gmail.com>
Date: Thu, 9 Oct 2025 14:29:11 -0400
Subject: [PATCH 13/13] docstrings

---
 modflow_devtools/dfn/__init__.py | 27 ++++++++++++++++-----------
 1 file changed, 16 insertions(+), 11 deletions(-)

diff --git a/modflow_devtools/dfn/__init__.py b/modflow_devtools/dfn/__init__.py
index 6f966dd9..c532d099 100644
--- a/modflow_devtools/dfn/__init__.py
+++ b/modflow_devtools/dfn/__init__.py
@@ -406,7 +406,12 @@ def _load_common(f) -> Fields:
 
 
 def load_flat(path: str | PathLike) -> Dfns:
-    """Load a MODFLOW 6 specification from definition files in a directory."""
+    """
+    Load a flat MODFLOW 6 specification from definition files in a directory.
+
+    Returns a dictionary of unlinked DFNs, i.e. without `children` populated.
+    Components will have `parent` populated if the schema is v2 but not if v1.
+    """
     exclude = ["common", "flopy"]
     path = Path(path).expanduser().resolve()
     dfn_paths = {p.stem: p for p in path.glob("*.dfn") if p.stem not in exclude}
@@ -425,6 +430,16 @@ def load_flat(path: str | PathLike) -> Dfns:
     return dfns
 
 
+def load_tree(path: str | PathLike) -> Dfn:
+    """
+    Load a structured MODFLOW 6 specification from definition files in a directory.
+
+    A single root component definition (the simulation) is returned. This contains
+    child (and grandchild) components for the relevant models and packages.
+    """
+    return to_tree(load_flat(path))
+
+
 def to_tree(dfns: Dfns) -> Dfn:
     """
     Infer the MODFLOW 6 input component hierarchy from a flat spec:
@@ -506,13 +521,3 @@ def _flatten(dfn: Dfn) -> Dfns:
         return dfns
 
     return _flatten(dfn)
-
-
-def load_tree(dfndir: str | PathLike) -> Dfn:
-    """
-    Load a structured MODFLOW 6 specification from definition files in a directory.
-
-    A single root component definition (the simulation) is returned. This contains
-    child (and grandchild) components for the relevant models and packages.
-    """
-    return to_tree(load_flat(dfndir))