Changeset - f508df06c162
[Not reviewed]
0 3 0
Brett Smith - 3 years ago 2021-02-19 23:54:36
brettcsmith@brettcsmith.org
rewrite: Richer exceptions for error reporting.
3 files changed with 131 insertions and 50 deletions:
0 comments (0 inline, 0 general)
conservancy_beancount/errors.py
Show inline comments
...
 
@@ -6,12 +6,13 @@
 
# LICENSE.txt in the repository.
 

	
 
import beancount.core.data as bc_data
 

	
 
from typing import (
 
    Any,
 
    ClassVar,
 
    Iterable,
 
    Optional,
 
)
 

	
 
from .beancount_types import (
 
    Directive,
...
 
@@ -124,6 +125,44 @@ class InvalidMetadataError(Error):
 
            msg = "{} has wrong type of {}: expected {} but is a {}".format(
 
                srcname, key, need_type.__name__, type(value).__name__,
 
            )
 
        super().__init__(msg, txn, source)
 
        self.key = key
 
        self.value = value
 

	
 

	
 
class RewriteRuleError(ValueError):
 
    item_type: ClassVar[Optional[str]] = None
 

	
 
    def __init__(self,
 
                 message: str,
 
                 filename: Optional[str]=None,
 
                 rulenum: Optional[int]=None,
 
                 source: Optional[Any]=None,
 
    ) -> None:
 
        super().__init__(message, filename, rulenum, source)
 
        self.message = message
 
        self.filename = filename
 
        self.rulenum = rulenum
 
        self.source = source
 

	
 
    def __str__(self) -> str:
 
        msg_parts = [self.message]
 
        if self.filename is not None:
 
            msg_parts.append(f"in {self.filename}")
 
        if self.rulenum is not None:
 
            msg_parts.append(f"rule #{self.rulenum}")
 
            if self.item_type is not None:
 
                msg_parts.append(self.item_type)
 
        return ' '.join(msg_parts)
 

	
 

	
 
class RewriteRuleActionError(RewriteRuleError):
 
    item_type = 'action'
 

	
 

	
 
class RewriteRuleConditionError(RewriteRuleError):
 
    item_type = 'condition'
 

	
 

	
 
class RewriteRuleLoadError(RewriteRuleError): pass
 
class RewriteRuleValidationError(RewriteRuleError): pass
conservancy_beancount/reports/rewrite.py
Show inline comments
...
 
@@ -146,12 +146,13 @@ import enum
 
import functools
 
import logging
 
import operator as opmod
 
import re
 

	
 
from typing import (
 
    Any,
 
    Callable,
 
    Dict,
 
    Generic,
 
    IO,
 
    Iterable,
 
    Iterator,
...
 
@@ -174,12 +175,13 @@ from ..beancount_types import (
 

	
 
from pathlib import Path
 

	
 
import yaml
 

	
 
from .. import data
 
from .. import errors
 

	
 
Decimal = decimal.Decimal
 
T = TypeVar('T')
 
TestCallable = Callable[[T, T], bool]
 

	
 
CMP_OPS: Mapping[str, TestCallable] = {
...
 
@@ -196,28 +198,28 @@ CMP_OPS: Mapping[str, TestCallable] = {
 
SUBJECT_PAT = r'((?:\.\w+)+|[a-z][-\w]*)\b\s*'
 

	
 
logger = logging.getLogger('conservancy_beancount.reports.rewrite')
 

	
 
class _Registry(Generic[T]):
 
    def __init__(self,
 
                 description: str,
 
                 error_cls: Type[errors.RewriteRuleError],
 
                 parser: Union[str, Pattern],
 
                 default: Type[T],
 
                 *others: Tuple[str, Type[T]],
 
    ) -> None:
 
        if isinstance(parser, str):
 
            parser = re.compile(parser)
 
        self.description = description
 
        self.error_cls = error_cls
 
        self.parser = parser
 
        self.default = default
 
        self.registry: Mapping[str, Type[T]] = dict(others)
 

	
 
    def parse(self, s: str) -> T:
 
        match = self.parser.match(s)
 
        if match is None:
 
            raise ValueError(f"could not parse {self.description} {s!r}")
 
            raise self.error_cls(f"parse error: {s!r}")
 
        subject = match.group(1)
 
        operator = match.group(2)
 
        operand = s[match.end():].strip()
 
        if not subject.startswith('.'):
 
            # FIXME: To avoid this type ignore, I would have to define a common
 
            # superclass for Tester and Setter that provides a useful signature
...
 
@@ -225,25 +227,26 @@ class _Registry(Generic[T]):
 
            # and then use that as the bound for our type variable.
 
            # Not a priority right now.
 
            return self.default(subject, operator, operand)  # type:ignore[call-arg]
 
        try:
 
            retclass = self.registry[subject]
 
        except KeyError:
 
            raise ValueError(f"unknown subject in {self.description} {subject!r}") from None
 
            raise self.error_cls(f"unknown subject: {subject!r}") from None
 
        else:
 
            return retclass(operator, operand)  # type:ignore[call-arg]
 

	
 

	
 
class Tester(Generic[T], metaclass=abc.ABCMeta):
 
    ERROR = errors.RewriteRuleConditionError
 
    OPS: Mapping[str, TestCallable] = CMP_OPS
 

	
 
    def __init__(self, operator: str, operand: str) -> None:
 
        try:
 
            self.op_func = self.OPS[operator]
 
        except KeyError:
 
            raise ValueError(f"unsupported operator {operator!r}") from None
 
            raise self.ERROR(f"unsupported operator: {operator!r}") from None
 
        self.operand = self.parse_operand(operand)
 

	
 
    @staticmethod
 
    @abc.abstractmethod
 
    def parse_operand(operand: str) -> T: ...
 

	
...
 
@@ -265,13 +268,13 @@ class AccountTest(Tester[str]):
 

	
 
    @staticmethod
 
    def parse_operand(operand: str) -> str:
 
        if data.Account.is_account(f'{operand}:RootsOK'):
 
            return operand
 
        else:
 
            raise ValueError(f"invalid account name {operand!r}")
 
            raise errors.RewriteRuleConditionError(f"invalid account name: {operand!r}")
 

	
 
    def post_get(self, post: data.Posting) -> str:
 
        return post.account
 

	
 
    def __call__(self, post: data.Posting) -> bool:
 
        try:
...
 
@@ -280,13 +283,16 @@ class AccountTest(Tester[str]):
 
            return super().__call__(post)
 

	
 

	
 
class DateTest(Tester[datetime.date]):
 
    @staticmethod
 
    def parse_operand(operand: str) -> datetime.date:
 
        return datetime.datetime.strptime(operand, '%Y-%m-%d').date()
 
        try:
 
            return datetime.datetime.strptime(operand, '%Y-%m-%d').date()
 
        except ValueError as error:
 
            raise errors.RewriteRuleConditionError(error.args[0])
 

	
 
    def post_get(self, post: data.Posting) -> datetime.date:
 
        return post.meta.date
 

	
 

	
 
class MetadataTest(Tester[Optional[MetaValue]]):
...
 
@@ -326,20 +332,20 @@ class MetadataTest(Tester[Optional[MetaValue]]):
 
class NumberTest(Tester[Decimal]):
 
    @staticmethod
 
    def parse_operand(operand: str) -> Decimal:
 
        try:
 
            return Decimal(operand)
 
        except decimal.DecimalException:
 
            raise ValueError(f"could not parse decimal {operand!r}")
 
            raise errors.RewriteRuleConditionError(f"decimal parse error: {operand!r}")
 

	
 
    def post_get(self, post: data.Posting) -> Decimal:
 
        return post.units.number
 

	
 

	
 
TestRegistry: _Registry[Tester] = _Registry(
 
    'condition',
 
    Tester.ERROR,
 
    '^{}{}'.format(
 
        SUBJECT_PAT,
 
        r'({}|in)'.format('|'.join(re.escape(s) for s in Tester.OPS)),
 
    ),
 
    MetadataTest,
 
    ('.account', AccountTest),
...
 
@@ -350,51 +356,62 @@ TestRegistry: _Registry[Tester] = _Registry(
 
class Setter(Generic[T], metaclass=abc.ABCMeta):
 
    _regparser = re.compile(r'^{}{}'.format(
 
        SUBJECT_PAT,
 
        r'',
 
    ))
 
    _regtype = 'setter'
 
    ERROR = errors.RewriteRuleActionError
 

	
 
    @abc.abstractmethod
 
    def __call__(self, post: data.Posting) -> Tuple[str, T]: ...
 

	
 

	
 
class AccountSet(Setter[data.Account]):
 
    def __init__(self, operator: str, value: str) -> None:
 
        if operator != '=':
 
            raise ValueError(f"unsupported operator for account {operator!r}")
 
        self.value = data.Account(AccountTest.parse_operand(value))
 
            raise self.ERROR(f"unsupported operator for account: {operator!r}")
 
        try:
 
            self.value = data.Account(AccountTest.parse_operand(value))
 
        except errors.RewriteRuleConditionError as error:
 
            new_error = errors.RewriteRuleActionError(*error.args)
 
            new_error.__cause__ = error.__cause__
 
            raise new_error
 

	
 
    def __call__(self, post: data.Posting) -> Tuple[str, data.Account]:
 
        return ('account', self.value)
 

	
 

	
 
class MetadataSet(Setter[str]):
 
    def __init__(self, key: str, operator: str, value: str) -> None:
 
        if operator != '=':
 
            raise ValueError(f"unsupported operator for metadata {operator!r}")
 
            raise self.ERROR(f"unsupported operator for metadata: {operator!r}")
 
        self.key = key
 
        self.value = value
 

	
 
    def __call__(self, post: data.Posting) -> Tuple[str, str]:
 
        return (self.key, self.value)
 

	
 

	
 
class NumberSet(Setter[data.Amount]):
 
    def __init__(self, operator: str, value: str) -> None:
 
        if operator != '*=':
 
            raise ValueError(f"unsupported operator for number {operator!r}")
 
        self.value = NumberTest.parse_operand(value)
 
            raise self.ERROR(f"unsupported operator for number: {operator!r}")
 
        try:
 
            self.value = NumberTest.parse_operand(value)
 
        except errors.RewriteRuleConditionError as error:
 
            new_error = errors.RewriteRuleActionError(*error.args)
 
            new_error.__cause__ = error.__cause__
 
            raise new_error
 

	
 
    def __call__(self, post: data.Posting) -> Tuple[str, data.Amount]:
 
        number = post.units.number * self.value
 
        return ('units', post.units._replace(number=number))
 

	
 

	
 
SetRegistry: _Registry[Setter] = _Registry(
 
    'action',
 
    Setter.ERROR,
 
    rf'^{SUBJECT_PAT}([-+/*]?=)',
 
    MetadataSet,
 
    ('.account', AccountSet),
 
    ('.number', NumberSet),
 
)
 

	
...
 
@@ -410,12 +427,14 @@ class _RootAccount(enum.Enum):
 
            return cls[root]
 
        except KeyError:
 
            return cls.Equity
 

	
 

	
 
class RewriteRule:
 
    ERROR = errors.RewriteRuleValidationError
 

	
 
    def __init__(self, source: Mapping[str, List[str]]) -> None:
 
        self.new_meta: List[Sequence[MetadataSet]] = []
 
        self.rewrites: List[Sequence[Setter]] = []
 
        for key, rules in source.items():
 
            if key == 'if':
 
                self.tests = [TestRegistry.parse(rule) for rule in rules]
...
 
@@ -424,24 +443,24 @@ class RewriteRule:
 
                rewrites: List[Setter] = []
 
                for rule_s in rules:
 
                    setter = SetRegistry.parse(rule_s)
 
                    if isinstance(setter, MetadataSet):
 
                        new_meta.append(setter)
 
                    elif any(isinstance(t, type(setter)) for t in rewrites):
 
                        raise ValueError(f"rule conflicts with earlier action: {rule_s!r}")
 
                        raise self.ERROR(f"rule conflicts with earlier action: {rule_s!r}")
 
                    else:
 
                        rewrites.append(setter)
 
                self.new_meta.append(new_meta)
 
                self.rewrites.append(rewrites)
 

	
 
        try:
 
            if_ok = any(self.tests)
 
        except AttributeError:
 
            if_ok = False
 
        if not if_ok:
 
            raise ValueError("no `if` condition in rule") from None
 
            raise self.ERROR("no `if` condition in rule") from None
 

	
 
        account_conditions: Set[_RootAccount] = set()
 
        for test in self.tests:
 
            if isinstance(test, AccountTest):
 
                try:
 
                    operands = test.under_args
...
 
@@ -457,24 +476,24 @@ class RewriteRule:
 
        for rewrite in self.rewrites:
 
            rewrite_number = Decimal(1)
 
            for rule in rewrite:
 
                if isinstance(rule, AccountSet):
 
                    new_root = _RootAccount.from_account(rule.value)
 
                    if new_root is not account_condition:
 
                        raise ValueError(
 
                        raise self.ERROR(
 
                            f"cannot assign {new_root} account "
 
                            f"when `if` checks for {account_condition}",
 
                        )
 
                elif isinstance(rule, NumberSet):
 
                    rewrite_number = rule.value
 
            number_reallocation += rewrite_number
 

	
 
        if not number_reallocation:
 
            raise ValueError("no rewrite actions in rule")
 
            raise self.ERROR("no rewrite actions")
 
        elif number_reallocation != 1:
 
            raise ValueError(f"rule multiplies number by {number_reallocation}")
 
            raise self.ERROR(f"rule multiplies number by {number_reallocation}")
 

	
 
    def match(self, post: data.Posting) -> bool:
 
        return all(test(post) for test in self.tests)
 

	
 
    def rewrite(self, post: data.Posting) -> Iterator[data.Posting]:
 
        for rewrite, new_meta in zip(self.rewrites, self.new_meta):
...
 
@@ -497,26 +516,54 @@ class RewriteRuleset:
 
                    yield from rule.rewrite(post)
 
                    break
 
            else:
 
                yield post
 

	
 
    @classmethod
 
    def from_yaml(cls, source: Union[str, IO, Path]) -> 'RewriteRuleset':
 
    def _iter_yaml(cls, source: Iterable[Any], name: str) -> Iterator[RewriteRule]:
 
        for number, item in enumerate(source, 1):
 
            try:
 
                if not isinstance(item, Mapping):
 
                    raise errors.RewriteRuleLoadError(f"item is not a rule hash")
 
                for key, value in item.items():
 
                    if not isinstance(value, list):
 
                        raise errors.RewriteRuleLoadError(
 
                            f"YAML item {number} {key!r} value is not a list",
 
                        )
 
                    elif not all(isinstance(s, str) for s in value):
 
                        raise errors.RewriteRuleLoadError(
 
                            f"YAML item {number} {key!r} value is not all strings",
 
                        )
 
                yield RewriteRule(item)
 
            except errors.RewriteRuleError as error:
 
                error.filename = name
 
                error.rulenum = number
 
                error.source = item
 
                raise
 

	
 
    @classmethod
 
    def from_yaml(
 
            cls,
 
            source: Union[str, IO, Path],
 
            name: Optional[str]=None,
 
    ) -> 'RewriteRuleset':
 
        if isinstance(source, Path):
 
            with source.open() as source_file:
 
                return cls.from_yaml(source_file)
 
        doc = yaml.safe_load(source)
 
        if not isinstance(doc, list):
 
            raise ValueError("YAML root element is not a list")
 
        for number, item in enumerate(doc, 1):
 
            if not isinstance(item, Mapping):
 
                raise ValueError(f"YAML item {number} is not a rule hash")
 
            for key, value in item.items():
 
                if not isinstance(value, list):
 
                    raise ValueError(f"YAML item {number} {key!r} value is not a list")
 
                elif not all(isinstance(s, str) for s in value):
 
                    raise ValueError(f"YAML item {number} {key!r} value is not all strings")
 
                return cls.from_yaml(source_file, str(source))
 
        if name is None:
 
            if isinstance(source, str):
 
                name = '<string>'
 
            else:
 
                name = getattr(source, 'name', '<file>')
 
        try:
 
            logger.debug("loaded %s rewrite rules from YAML", number)
 
        except NameError:
 
            logger.warning("YAML source is empty; no rewrite rules loaded")
 
        return cls(RewriteRule(src) for src in doc)
 
            doc = yaml.safe_load(source)
 
        except yaml.error.YAMLError as error:
 
            raise errors.RewriteRuleLoadError(str(error), name)
 
        if not isinstance(doc, list):
 
            raise errors.RewriteRuleLoadError("YAML root element is not a list", name)
 
        retval = cls(cls._iter_yaml(doc, name))
 
        logger.log(
 
            logging.DEBUG if retval.rules else logging.WARNING,
 
            "loaded %s rewrite rules from %s",
 
            len(retval.rules), name,
 
        )
 
        return retval
tests/test_reports_rewrite.py
Show inline comments
...
 
@@ -12,13 +12,13 @@ import pytest
 
from decimal import Decimal
 

	
 
import yaml
 

	
 
from . import testutil
 

	
 
from conservancy_beancount import data
 
from conservancy_beancount import data, errors
 
from conservancy_beancount.reports import rewrite
 

	
 
CMP_OPS = frozenset('< <= == != >= >'.split())
 

	
 
@pytest.mark.parametrize('name', ['Equity:Other', 'Expenses:Other', 'Income:Other'])
 
@pytest.mark.parametrize('operator', CMP_OPS)
...
 
@@ -128,13 +128,13 @@ def test_parse_good_condition(subject, operator, operand):
 
    '.number > 0xff',  # Bad operand
 
    '.number in 16',  # Bad operator
 
    'units.number == 5',  # Bad subject (syntax)
 
    '.units == 5',  # Bad subject (unknown)
 
])
 
def test_parse_bad_condition(cond_s):
 
    with pytest.raises(ValueError):
 
    with pytest.raises(errors.RewriteRuleConditionError):
 
        rewrite.TestRegistry.parse(cond_s)
 

	
 
@pytest.mark.parametrize('value', ['Equity:Other', 'Income:Other'])
 
def test_account_set(value):
 
    value = data.Account(value)
 
    txn = testutil.Transaction(postings=[
...
 
@@ -192,13 +192,13 @@ def test_parse_good_set(subject, operator, operand):
 
    '.number*=0xff',  # Bad operand
 
    '.number=5',  # Bad operator
 
    'testkey += foo',  # Bad operator
 
    'testkey *= 3',  # Bad operator
 
])
 
def test_parse_bad_set(set_s):
 
    with pytest.raises(ValueError):
 
    with pytest.raises(errors.RewriteRuleActionError):
 
        rewrite.SetRegistry.parse(set_s)
 

	
 
def test_good_rewrite_rule():
 
    rule = rewrite.RewriteRule({
 
        'if': ['.account in Income'],
 
        'add': ['income-type = Other'],
...
 
@@ -268,32 +268,27 @@ def test_valid_rewrite_rule(source):
 

	
 
@pytest.mark.parametrize('source', [
 
    # Incomplete rules
 
    {},
 
    {'if': ['.account in Equity']},
 
    {'a': ['.account = Income:Other'], 'b': ['.account = Expenses:Other']},
 
    # Condition/assignment mixup
 
    {'if': ['.account = Equity:Other'], 'then': ['equity-type = other']},
 
    {'if': ['.account == Equity:Other'], 'then': ['equity-type != other']},
 
    # Cross-category account assignment
 
    {'if': ['.date >= 2020-01-01'], 'then': ['.account = Assets:Cash']},
 
    {'if': ['.account in Equity'], 'then': ['.account = Assets:Cash']},
 
    # Number reallocation != 1
 
    {'if': ['.date >= 2020-01-01'], 'then': ['.number *= .5']},
 
    {'if': ['.date >= 2020-01-01'], 'a': ['k1=v1'], 'b': ['k2=v2']},
 
    # Date assignment
 
    {'if': ['.date == 2020-01-01'], 'then': ['.date = 2020-02-02']},
 
    # Redundant assignments
 
    {'if': ['.account in Income'],
 
     'then': ['.account = Income:Other', '.account = Income:Other']},
 
    {'if': ['.number > 0'],
 
     'a': ['.number *= .5', '.number *= .5'],
 
     'b': ['.number *= .5']},
 
])
 
def test_invalid_rewrite_rule(source):
 
    with pytest.raises(ValueError):
 
    with pytest.raises(errors.RewriteRuleValidationError):
 
        rewrite.RewriteRule(source)
 

	
 
def test_rewrite_ruleset():
 
    account = 'Income:CurrencyConversion'
 
    ruleset = rewrite.RewriteRuleset(rewrite.RewriteRule(src) for src in [
 
        {'if': ['.account == Expenses:CurrencyConversion'],
...
 
@@ -330,27 +325,27 @@ def test_ruleset_from_yaml_str():
 
    with testutil.test_path('userconfig/Rewrites01.yml').open() as yaml_file:
 
        yaml_s = yaml_file.read()
 
    assert rewrite.RewriteRuleset.from_yaml(yaml_s)
 

	
 
def test_bad_ruleset_yaml_path():
 
    yaml_path = testutil.test_path('repository/Projects/project-data.yml')
 
    with pytest.raises(ValueError):
 
    with pytest.raises(errors.RewriteRuleLoadError):
 
        rewrite.RewriteRuleset.from_yaml(yaml_path)
 

	
 
@pytest.mark.parametrize('source', [
 
    # Wrong root objects
 
    1,
 
    2.3,
 
    True,
 
    None,
 
    {},
 
    'string',
 
    [{}, 'a'],
 
    [{}, ['b']],
 
    ['a'],
 
    [['b']],
 
    # Rules have wrong type
 
    [{'if': '.account in Equity', 'add': ['testkey = value']}],
 
    [{'if': ['.account in Equity'], 'add': 'testkey = value'}],
 
])
 
def test_bad_ruleset_yaml_str(source):
 
    yaml_doc = yaml.safe_dump(source)
 
    with pytest.raises(ValueError):
 
    with pytest.raises(errors.RewriteRuleLoadError):
 
        rewrite.RewriteRuleset.from_yaml(yaml_doc)
0 comments (0 inline, 0 general)