query: Development cleanup.

Reorder classes for nicer readability. Put shorter classes higher up, keep related classes together. Add developer-facing comments. Remove unused imports.
2021-03-09 10:33:11 -05:00 · 2021-03-09 10:33:11 -05:00 · c5a2c2d39b
commit c5a2c2d39b
parent 5893d6a59a
1 changed files with 162 additions and 152 deletions
--- a/conservancy_beancount/reports/query.py
+++ b/conservancy_beancount/reports/query.py
@ -11,12 +11,10 @@ import datetime
 import enum
 import itertools
 import logging
 import re
 import sys
 from typing import (
    cast,
    AbstractSet,
    Any,
    Callable,
    Dict,
@ -35,8 +33,6 @@ from typing import (
 from ..beancount_types import (
    MetaKey,
    MetaValue,
    Posting,
    Transaction,
 )
 from decimal import Decimal
@ -91,6 +87,81 @@ QueryStatement = Union[
    bc_query_parser.Select,
 ]
 # This class supports type checking. Beancount code dynamically sets the
 # ``store`` attribute, in bc_query_execute.execute_query().
 class Context(bc_query_execute.RowContext):
    # Annotation only: nothing is assigned here. It tells type checkers that
    # a ``store`` attribute of type Store exists on row contexts.
    store: Store
 class MetaDocs(bc_query_env.AnyMeta):
    """Look up a metadata value and return it as a list of document links.

    A string value is split on whitespace; any other value (including a
    missing one) yields an empty list.
    """
    def __init__(self, operands: List[str]) -> None:
        # The two-argument super() starts method lookup *after* AnyMeta in
        # the MRO, so AnyMeta's own __init__ is skipped and we can pass the
        # result type ourselves. That type (the second argument) should
        # agree with the return annotation of __call__ below.
        super(bc_query_env.AnyMeta, self).__init__(operands, list)
    def __call__(self, context: Context) -> List[str]:
        found = super().__call__(context)
        return found.split() if isinstance(found, str) else []
 class StrMeta(bc_query_env.AnyMeta):
    """Look up metadata the way AnyMeta does, but always produce a string.

    A missing value (None) becomes the empty string; everything else is
    passed through str().
    """
    def __init__(self, operands: List[str]) -> None:
        # The two-argument super() skips AnyMeta's own __init__ so the
        # result type can be given explicitly as str.
        super(bc_query_env.AnyMeta, self).__init__(operands, str)
    def __call__(self, context: Context) -> str:
        found = super().__call__(context)
        return '' if found is None else str(found)
 class AggregateSet(bc_query_compile.EvalAggregator):
    """Aggregator that collects every value it is given into a single set.

    Non-string, non-tuple sequences are merged element by element; any
    other value is added to the set as one member.
    """
    __intypes__ = [object]
    def __init__(self, operands: List[str]) -> None:
        # ``set`` is the result type. initialize() instantiates it through
        # self.dtype, and it matches the return annotation of __call__.
        super().__init__(operands, set)
    def allocate(self, allocator: bc_query_execute.Allocator) -> None:
        """Reserve a slot in result storage and remember its handle."""
        self.handle = allocator.allocate()
    def initialize(self, store: Store) -> None:
        """Reset our storage slot to a fresh, empty result container."""
        store[self.handle] = self.dtype()
    def update(self, store: Store, context: Context) -> None:
        """Fold the value evaluated for this row into the stored set."""
        (value,) = self.eval_args(context)
        collected = store[self.handle]
        # Strings and tuples are sequences too, but they are kept whole
        # rather than being exploded into their elements.
        keep_whole = isinstance(value, (str, tuple)) or not isinstance(value, Sequence)
        if keep_whole:
            collected.add(value)
        else:
            collected.update(value)
    def __call__(self, context: Context) -> set:
        """Return the set accumulated so far for this aggregation."""
        return context.store[self.handle]  # type:ignore[no-any-return]
 class FilterPostingsEnvironment(bc_query_env.FilterPostingsEnvironment):
    # Work on a copy of the upstream function table (via .copy()) rather
    # than on the parent class's own attribute.
    functions: EnvironmentFunctions = bc_query_env.FilterPostingsEnvironment.functions.copy()  # type:ignore[assignment]
    # Register this module's metadata functions under the names 'meta_docs'
    # and 'str_meta'.
    functions['meta_docs'] = MetaDocs
    functions['str_meta'] = StrMeta
 class TargetsEnvironment(bc_query_env.TargetsEnvironment):
    # Start from a copy of the posting-filter table, which already includes
    # 'meta_docs' and 'str_meta'.
    functions = FilterPostingsEnvironment.functions.copy()
    # Layer the upstream aggregator functions on top, then register
    # AggregateSet as 'set'. 'set' is assigned after the update, so it takes
    # precedence over any same-named entry in AGGREGATOR_FUNCTIONS.
    functions.update(bc_query_env.AGGREGATOR_FUNCTIONS)
    functions['set'] = AggregateSet
 class BooksLoader:
    """Closure to load books with a zero-argument callable
@ -128,8 +199,91 @@ class BooksLoader:
        return result
 class BQLShell(bc_query_shell.BQLShell):
    """Query shell wired to this module's environments, with ODS output.

    Output formats are dispatched by name: the ``format`` shell variable
    selects the ``_render_<format>`` method used for SELECT results.
    """
    def __init__(
            self,
            is_interactive: bool,
            loadfun: Callable[[], books.LoadResult],
            outfile: TextIO,
            default_format: str='text',
            do_numberify: bool=False,
            rt_wrapper: Optional[rtutil.RT]=None,
    ) -> None:
        super().__init__(is_interactive, loadfun, outfile, default_format, do_numberify)
        # Use this module's environments, which add the meta_docs, str_meta,
        # and set functions to the query language.
        self.env_postings = FilterPostingsEnvironment()
        self.env_targets = TargetsEnvironment()
        # Spreadsheet writer used by the 'ods' output format.
        self.ods = QueryODS(rt_wrapper)
    def on_Select(self, statement: QueryStatement) -> None:
        """Compile, execute, and render one SELECT statement.

        An unknown output format, or any exception raised while compiling,
        executing, or numberifying, is logged as an error and the statement
        is abandoned. The traceback is included only when debug logging is
        enabled.
        """
        output_format: str = self.vars['format']
        try:
            render_func = getattr(self, f'_render_{output_format}')
        except AttributeError:
            logger.error("unknown output format %r", output_format)
            return
        try:
            logger.debug("compiling query")
            compiled_query = bc_query_compile.compile(
                statement, self.env_targets, self.env_postings, self.env_entries,
            )
            logger.debug("executing query")
            row_types, rows = bc_query_execute.execute_query(
                compiled_query, self.entries, self.options_map,
            )
            if self.vars['numberify']:
                logger.debug("numberifying query")
                built_dcontext = self.options_map['dcontext'].build()
                row_types, rows = bc_query_numberify.numberify_results(
                    row_types, rows, built_dcontext,
                )
        except Exception as error:
            show_traceback = logger.isEnabledFor(logging.DEBUG)
            logger.error(str(error), exc_info=show_traceback)
            return
        # ODS output is rendered even when there are no rows; the other
        # formats just report that the result is empty.
        if rows or output_format == 'ods':
            logger.debug("rendering query as %s", output_format)
            render_func(statement, row_types, rows)
        else:
            print("(empty)", file=self.outfile)
    def _render_csv(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Write the results to the shell's output file as CSV."""
        dcontext = self.options_map['dcontext']
        expand = self.vars['expand']
        bc_query_render.render_csv(row_types, rows, dcontext, self.outfile, expand)
    def _render_ods(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Add the results to the ODS document and log where they went."""
        self.ods.write_query(statement, row_types, rows)
        row_count = len(rows)
        sheet_name = self.ods.sheet.getAttribute('name')
        logger.info("%s rows of results saved in sheet %s", row_count, sheet_name)
    def _render_text(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Render the results as a text table, paged when interactive."""
        with contextlib.ExitStack() as stack:
            # The pager is entered on the stack so it is closed when
            # rendering finishes; the plain output file is left alone.
            output = (
                stack.enter_context(self.get_pager())
                if self.is_interactive
                else self.outfile
            )
            bc_query_render.render_text(
                row_types,
                rows,
                self.options_map['dcontext'],
                output,
                self.vars['expand'],
                self.vars['boxed'],
                self.vars['spaced'],
            )
 class QueryODS(core.BaseODS[NamedTuple, None]):
    META_FNAMES = frozenset([
        # Names of functions, as defined in Environments, that look up
        # posting metadata that could contain documentation links
        'any_meta',
        'entry_meta',
        'meta',
@ -264,154 +418,6 @@ class QueryODS(core.BaseODS[NamedTuple, None]):
            ))
 # This class mostly supports type checking. Beancount code dynamically sets the
 # ``store`` attribute, in bc_query_execute.execute_query().
 class Context(bc_query_execute.RowContext):
    # Annotation only: nothing is assigned here. It tells type checkers that
    # a ``store`` attribute of type Store exists on row contexts.
    store: Store
 class MetaDocs(bc_query_env.AnyMeta):
    """Look up a metadata value and return it as a list of document links.

    A string value is split on whitespace; any other value (including a
    missing one) yields an empty list.
    """
    def __init__(self, operands: List[str]) -> None:
        # The two-argument super() starts method lookup *after* AnyMeta in
        # the MRO, so AnyMeta's own __init__ is skipped and the result type
        # (list) is passed explicitly as the second argument.
        super(bc_query_env.AnyMeta, self).__init__(operands, list)
    def __call__(self, context: Context) -> List[str]:
        found = super().__call__(context)
        return found.split() if isinstance(found, str) else []
 class StrMeta(bc_query_env.AnyMeta):
    """Look up metadata the way AnyMeta does, but always produce a string.

    A missing value (None) becomes the empty string; everything else is
    passed through str().
    """
    def __init__(self, operands: List[str]) -> None:
        # The two-argument super() skips AnyMeta's own __init__ so the
        # result type can be given explicitly as str.
        super(bc_query_env.AnyMeta, self).__init__(operands, str)
    def __call__(self, context: Context) -> str:
        found = super().__call__(context)
        return '' if found is None else str(found)
 class AggregateSet(bc_query_compile.EvalAggregator):
    """Aggregator that collects every value it is given into a single set.

    Non-string, non-tuple sequences are merged element by element; any
    other value is added to the set as one member.
    """
    __intypes__ = [object]
    def __init__(self, operands: List[str]) -> None:
        # ``set`` is the result type. initialize() instantiates it through
        # self.dtype, and it matches the return annotation of __call__.
        super().__init__(operands, set)
    def allocate(self, allocator: bc_query_execute.Allocator) -> None:
        """Reserve a slot in result storage and remember its handle."""
        self.handle = allocator.allocate()
    def initialize(self, store: Store) -> None:
        """Reset our storage slot to a fresh, empty result container."""
        store[self.handle] = self.dtype()
    def update(self, store: Store, context: Context) -> None:
        """Fold the value evaluated for this row into the stored set."""
        (value,) = self.eval_args(context)
        collected = store[self.handle]
        # Strings and tuples are sequences too, but they are kept whole
        # rather than being exploded into their elements.
        keep_whole = isinstance(value, (str, tuple)) or not isinstance(value, Sequence)
        if keep_whole:
            collected.add(value)
        else:
            collected.update(value)
    def __call__(self, context: Context) -> set:
        """Return the set accumulated so far for this aggregation."""
        return context.store[self.handle]  # type:ignore[no-any-return]
 class FilterPostingsEnvironment(bc_query_env.FilterPostingsEnvironment):
    # Work on a copy of the upstream function table (via .copy()) rather
    # than on the parent class's own attribute.
    functions: EnvironmentFunctions = bc_query_env.FilterPostingsEnvironment.functions.copy()  # type:ignore[assignment]
    # Register this module's metadata functions under the names 'meta_docs'
    # and 'str_meta'.
    functions['meta_docs'] = MetaDocs
    functions['str_meta'] = StrMeta
 class TargetsEnvironment(bc_query_env.TargetsEnvironment):
    # Start from a copy of the posting-filter table, which already includes
    # 'meta_docs' and 'str_meta'.
    functions = FilterPostingsEnvironment.functions.copy()
    # Layer the upstream aggregator functions on top, then register
    # AggregateSet as 'set'. 'set' is assigned after the update, so it takes
    # precedence over any same-named entry in AGGREGATOR_FUNCTIONS.
    functions.update(bc_query_env.AGGREGATOR_FUNCTIONS)
    functions['set'] = AggregateSet
 class BQLShell(bc_query_shell.BQLShell):
    """Query shell wired to this module's environments, with ODS output.

    Output formats are dispatched by name: the ``format`` shell variable
    selects the ``_render_<format>`` method used for SELECT results.
    """
    def __init__(
            self,
            is_interactive: bool,
            loadfun: Callable[[], books.LoadResult],
            outfile: TextIO,
            default_format: str='text',
            do_numberify: bool=False,
            rt_wrapper: Optional[rtutil.RT]=None,
    ) -> None:
        super().__init__(is_interactive, loadfun, outfile, default_format, do_numberify)
        # Use this module's environments, which add the meta_docs, str_meta,
        # and set functions to the query language.
        self.env_postings = FilterPostingsEnvironment()
        self.env_targets = TargetsEnvironment()
        # Spreadsheet writer used by the 'ods' output format.
        self.ods = QueryODS(rt_wrapper)
    def on_Select(self, statement: QueryStatement) -> None:
        """Compile, execute, and render one SELECT statement.

        An unknown output format, or any exception raised while compiling,
        executing, or numberifying, is logged as an error and the statement
        is abandoned. The traceback is included only when debug logging is
        enabled.
        """
        output_format: str = self.vars['format']
        try:
            render_func = getattr(self, f'_render_{output_format}')
        except AttributeError:
            logger.error("unknown output format %r", output_format)
            return
        try:
            logger.debug("compiling query")
            compiled_query = bc_query_compile.compile(
                statement, self.env_targets, self.env_postings, self.env_entries,
            )
            logger.debug("executing query")
            row_types, rows = bc_query_execute.execute_query(
                compiled_query, self.entries, self.options_map,
            )
            if self.vars['numberify']:
                logger.debug("numberifying query")
                built_dcontext = self.options_map['dcontext'].build()
                row_types, rows = bc_query_numberify.numberify_results(
                    row_types, rows, built_dcontext,
                )
        except Exception as error:
            show_traceback = logger.isEnabledFor(logging.DEBUG)
            logger.error(str(error), exc_info=show_traceback)
            return
        # ODS output is rendered even when there are no rows; the other
        # formats just report that the result is empty.
        if rows or output_format == 'ods':
            logger.debug("rendering query as %s", output_format)
            render_func(statement, row_types, rows)
        else:
            print("(empty)", file=self.outfile)
    def _render_csv(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Write the results to the shell's output file as CSV."""
        dcontext = self.options_map['dcontext']
        expand = self.vars['expand']
        bc_query_render.render_csv(row_types, rows, dcontext, self.outfile, expand)
    def _render_ods(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Add the results to the ODS document and log where they went."""
        self.ods.write_query(statement, row_types, rows)
        row_count = len(rows)
        sheet_name = self.ods.sheet.getAttribute('name')
        logger.info("%s rows of results saved in sheet %s", row_count, sheet_name)
    def _render_text(self, statement: QueryStatement, row_types: RowTypes, rows: Rows) -> None:
        """Render the results as a text table, paged when interactive."""
        with contextlib.ExitStack() as stack:
            # The pager is entered on the stack so it is closed when
            # rendering finishes; the plain output file is left alone.
            output = (
                stack.enter_context(self.get_pager())
                if self.is_interactive
                else self.outfile
            )
            bc_query_render.render_text(
                row_types,
                rows,
                self.options_map['dcontext'],
                output,
                self.vars['expand'],
                self.vars['boxed'],
                self.vars['spaced'],
            )
 class ReportFormat(enum.Enum):
    TEXT = 'text'
    TXT = TEXT
@ -442,6 +448,10 @@ class SetFYDates(argparse.Action):
    ) -> None:
        value = cliutil.year_or_date_arg(str(values))
        namespace.start_date = value
        # The configuration hasn't been loaded, so we don't know the boundaries
        # of a fiscal year yet. But that's okay, because we just need to set
        # enough so that when these arguments are passed to a BooksLoader,
        # it'll load the right fiscal year.
        if isinstance(value, int):
            namespace.stop_date = value
        else: