efficient build

- postpone building until really needed
- rebuild only if artifacts change
- no build on source update
- prune takes the current resolver state instead of a global variable
2022-04-13 15:41:57 +02:00
parent 8ae5376d41
commit 1d9629566c
8 changed files with 302 additions and 270 deletions
--- a/lektor_groupby/watcher.py
+++ b/lektor_groupby/watcher.py
@@ -1,27 +1,17 @@
-from lektor.db import Database, Record  # typing
-from lektor.types.flow import Flow, FlowType
-from lektor.utils import bool_from_string
-
-from typing import Set, Dict, List, Tuple, Any, Union, NamedTuple
+from typing import TYPE_CHECKING, Dict, List, Tuple, Any, Union, NamedTuple
 from typing import Optional, Callable, Iterator, Generator
-from .vobj import GroupBySource
-from .config import Config
+from .model import ModelReader
 from .util import most_used_key
-
-
-# -----------------------------------
-#              Typing
-# -----------------------------------
-
-class FieldKeyPath(NamedTuple):
-    fieldKey: str
-    flowIndex: Optional[int] = None
-    flowKey: Optional[str] = None
+from .vobj import GroupBySource
+if TYPE_CHECKING:
+    from lektor.db import Database, Record
+    from .config import Config
+    from .model import FieldKeyPath


 class GroupByCallbackArgs(NamedTuple):
-    record: Record
-    key: FieldKeyPath
+    record: 'Record'
+    key: 'FieldKeyPath'
    field: Any  # lektor model data-field value


@@ -31,83 +21,15 @@ GroupingCallback = Callable[[GroupByCallbackArgs], Union[
 ]]


-# -----------------------------------
-#            ModelReader
-# -----------------------------------
-
-class GroupByModelReader:
-    ''' Find models and flow-models which contain attribute '''
-
-    def __init__(self, db: Database, attrib: str) -> None:
-        self._flows = {}  # type: Dict[str, Set[str]]
-        self._models = {}  # type: Dict[str, Dict[str, str]]
-        # find flow blocks containing attribute
-        for key, flow in db.flowblocks.items():
-            tmp1 = set(f.name for f in flow.fields
-                       if bool_from_string(f.options.get(attrib, False)))
-            if tmp1:
-                self._flows[key] = tmp1
-        # find models and flow-blocks containing attribute
-        for key, model in db.datamodels.items():
-            tmp2 = {}  # Dict[str, str]
-            for field in model.fields:
-                if bool_from_string(field.options.get(attrib, False)):
-                    tmp2[field.name] = '*'  # include all children
-                elif isinstance(field.type, FlowType) and self._flows:
-                    # only processed if at least one flow has attrib
-                    fbs = field.type.flow_blocks
-                    # if fbs == None, all flow-blocks are allowed
-                    if fbs is None or any(x in self._flows for x in fbs):
-                        tmp2[field.name] = '?'  # only some flow blocks
-            if tmp2:
-                self._models[key] = tmp2
-
-    def read(
-        self,
-        record: Record,
-        flatten: bool = False
-    ) -> Iterator[Tuple[FieldKeyPath, Any]]:
-        '''
-        Enumerate all fields of a Record with attrib = True.
-        Flows are either returned directly (flatten=False) or
-        expanded so that each flow-block is yielded (flatten=True)
-        '''
-        assert isinstance(record, Record)
-        for r_key, subs in self._models.get(record.datamodel.id, {}).items():
-            field = record[r_key]
-            if not field:
-                continue
-            if subs == '*':  # either normal field or flow type (all blocks)
-                if flatten and isinstance(field, Flow):
-                    for i, flow in enumerate(field.blocks):
-                        flowtype = flow['_flowblock']
-                        for f_key, block in flow._data.items():
-                            if f_key.startswith('_'):  # e.g., _flowblock
-                                continue
-                            yield FieldKeyPath(r_key, i, f_key), block
-                else:
-                    yield FieldKeyPath(r_key), field
-            else:  # always flow type (only some blocks)
-                for i, flow in enumerate(field.blocks):
-                    flowtype = flow['_flowblock']
-                    for f_key in self._flows.get(flowtype, []):
-                        yield FieldKeyPath(r_key, i, f_key), flow[f_key]
-
-
-# -----------------------------------
-#              Watcher
-# -----------------------------------
-
 class Watcher:
    '''
    Callback is called with (Record, FieldKeyPath, field-value).
    Callback may yield one or more (group, extra-info) tuples.
    '''

-    def __init__(self, config: Config) -> None:
+    def __init__(self, config: 'Config') -> None:
        self.config = config
-        self.flatten = True
-        self.callback = None  # type: GroupingCallback #type:ignore[assignment]
+        self._root = self.config.root

    def grouping(self, flatten: bool = True) \
            -> Callable[[GroupingCallback], None]:
@@ -122,28 +44,23 @@ class Watcher:
            self.callback = fn
        return _decorator

-    def initialize(self, db: Database) -> None:
+    def initialize(self, db: 'Database') -> None:
        ''' Reset internal state. You must initialize before each build! '''
        assert callable(self.callback), 'No grouping callback provided.'
-        self._root = self.config.root
-        self._model_reader = GroupByModelReader(db, attrib=self.config.key)
+        self._model_reader = ModelReader(db, self.config.key, self.flatten)
        self._state = {}  # type: Dict[str, Dict[Record, List[Any]]]
        self._group_map = {}  # type: Dict[str, List[str]]
-        self._processed = set()  # type: Set[str]

-    def should_process(self, node: Record) -> bool:
+    def should_process(self, node: 'Record') -> bool:
        ''' Check if record path is being watched. '''
        return node['_path'].startswith(self._root)

-    def process(self, record: Record) -> None:
+    def process(self, record: 'Record') -> None:
        '''
        Will iterate over all record fields and call the callback method.
        Each record is guaranteed to be processed only once.
        '''
-        if record.path in self._processed:
-            return
-        self._processed.add(record.path)
-        for key, field in self._model_reader.read(record, self.flatten):
+        for key, field in self._model_reader.read(record):
            _gen = self.callback(GroupByCallbackArgs(record, key, field))
            try:
                obj = next(_gen)
@@ -161,10 +78,11 @@ class Watcher:

    def _persist(
        self,
-        record: Record,
-        key: FieldKeyPath,
+        record: 'Record',
+        key: 'FieldKeyPath',
        obj: Union[str, tuple]
    ) -> str:
+        ''' Update internal state. Return slugified string. '''
        group = obj if isinstance(obj, str) else obj[0]
        slug = self.config.slugify(group)
        # init group-key
@@ -176,14 +94,14 @@ class Watcher:
        # init group extras
        if record not in self._state[slug]:
            self._state[slug][record] = []
-        # (optional) append extra
+        # append extras (or default value)
        if isinstance(obj, tuple):
            self._state[slug][record].append(obj[1])
        else:
-            self._state[slug][record].append(key.flowKey or key.fieldKey)
+            self._state[slug][record].append(key.fieldKey)
        return slug

-    def iter_sources(self, root: Record) -> Iterator[GroupBySource]:
+    def iter_sources(self, root: 'Record') -> Iterator[GroupBySource]:
        ''' Prepare and yield GroupBySource elements. '''
        for key, children in self._state.items():
            group = most_used_key(self._group_map[key])
@@ -192,7 +110,6 @@ class Watcher:
        del self._model_reader
        del self._state
        del self._group_map
-        del self._processed

    def __repr__(self) -> str:
        return '<GroupByWatcher key="{}" enabled={} callback={}>'.format(