[core] Refactoring IOFormats so there is one and only obvious way to send it.

This is the commit where I admit that having more than one input/output format for readers and writers was complicating the code too much for a very small gain, and that it would be easier to only have one way to do it. So such way is now: - Returning (or yielding) a dict if you have key-value type collections. - Returning (or yielding) a tuple if you have a list-type collection. - Returning (or yielding) something else otherwise, which will continue to work like the old "arg0" format. IOFORMAT options has been removed in favour of a RemovedOption, which will complain if you're still trying to set it to anything else than the one value allowed.
2017-10-15 21:37:22 +02:00
parent dc59c88c3d
commit 92cc400fe7
27 changed files with 427 additions and 269 deletions
--- a/tests/execution/test_node.py
+++ b/tests/execution/test_node.py
@ -0,0 +1,104 @@
+from bonobo import Bag, Graph
+from bonobo.strategies import NaiveStrategy
+from bonobo.util.testing import BufferingNodeExecutionContext, BufferingGraphExecutionContext
+
+
+def test_node_string():
+    def f():
+        return 'foo'
+
+    with BufferingNodeExecutionContext(f) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()
+
+        assert len(output) == 1
+        assert output[0] == (('foo', ), {})
+
+    def g():
+        yield 'foo'
+        yield 'bar'
+
+    with BufferingNodeExecutionContext(g) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()
+
+        assert len(output) == 2
+        assert output[0] == (('foo', ), {})
+        assert output[1] == (('bar', ), {})
+
+
+def test_node_bytes():
+    def f():
+        return b'foo'
+
+    with BufferingNodeExecutionContext(f) as context:
+        context.write_sync(Bag())
+
+        output = context.get_buffer()
+        assert len(output) == 1
+        assert output[0] == ((b'foo', ), {})
+
+    def g():
+        yield b'foo'
+        yield b'bar'
+
+    with BufferingNodeExecutionContext(g) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()
+
+        assert len(output) == 2
+        assert output[0] == ((b'foo', ), {})
+        assert output[1] == ((b'bar', ), {})
+
+
+def test_node_dict():
+    def f():
+        return {'id': 1, 'name': 'foo'}
+
+    with BufferingNodeExecutionContext(f) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()
+
+        assert len(output) == 1
+        assert output[0] == {'id': 1, 'name': 'foo'}
+
+    def g():
+        yield {'id': 1, 'name': 'foo'}
+        yield {'id': 2, 'name': 'bar'}
+
+    with BufferingNodeExecutionContext(g) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()
+
+        assert len(output) == 2
+        assert output[0] == {'id': 1, 'name': 'foo'}
+        assert output[1] == {'id': 2, 'name': 'bar'}
+
+
+def test_node_dict_chained():
+    strategy = NaiveStrategy(GraphExecutionContextType=BufferingGraphExecutionContext)
+
+    def uppercase_name(**kwargs):
+        return {**kwargs, 'name': kwargs['name'].upper()}
+
+    def f():
+        return {'id': 1, 'name': 'foo'}
+
+    graph = Graph(f, uppercase_name)
+    context = strategy.execute(graph)
+    output = context.get_buffer()
+
+    assert len(output) == 1
+    assert output[0] == {'id': 1, 'name': 'FOO'}
+
+    def g():
+        yield {'id': 1, 'name': 'foo'}
+        yield {'id': 2, 'name': 'bar'}
+
+    graph = Graph(g, uppercase_name)
+    context = strategy.execute(graph)
+    output = context.get_buffer()
+
+    assert len(output) == 2
+    assert output[0] == {'id': 1, 'name': 'FOO'}
+    assert output[1] == {'id': 2, 'name': 'BAR'}
--- a/tests/io/test_csv.py
+++ b/tests/io/test_csv.py
@ -3,25 +3,19 @@ import pytest
 from bonobo import Bag, CsvReader, CsvWriter, settings
 from bonobo.constants import BEGIN, END
 from bonobo.execution.node import NodeExecutionContext
-from bonobo.util.testing import CapturingNodeExecutionContext, FilesystemTester
+from bonobo.util.testing import FilesystemTester, BufferingNodeExecutionContext

 csv_tester = FilesystemTester('csv')
 csv_tester.input_data = 'a,b,c\na foo,b foo,c foo\na bar,b bar,c bar'


-def test_write_csv_to_file_arg0(tmpdir):
+def test_write_csv_ioformat_arg0(tmpdir):
    fs, filename, services = csv_tester.get_services_for_writer(tmpdir)
+    with pytest.raises(ValueError):
+        CsvWriter(path=filename, ioformat=settings.IOFORMAT_ARG0)

-    with NodeExecutionContext(CsvWriter(path=filename, ioformat=settings.IOFORMAT_ARG0), services=services) as context:
-        context.write(BEGIN, Bag({'foo': 'bar'}), Bag({'foo': 'baz', 'ignore': 'this'}), END)
-        context.step()
-        context.step()
-
-    with fs.open(filename) as fp:
-        assert fp.read() == 'foo\nbar\nbaz\n'
-
-    with pytest.raises(AttributeError):
-        getattr(context, 'file')
+    with pytest.raises(ValueError):
+        CsvReader(path=filename, delimiter=',', ioformat=settings.IOFORMAT_ARG0),


@pytest.mark.parametrize('add_kwargs', ({}, {
@ -30,7 +24,7 @@ def test_write_csv_to_file_arg0(tmpdir):
 def test_write_csv_to_file_kwargs(tmpdir, add_kwargs):
    fs, filename, services = csv_tester.get_services_for_writer(tmpdir)

-    with NodeExecutionContext(CsvWriter(path=filename, **add_kwargs), services=services) as context:
+    with NodeExecutionContext(CsvWriter(filename, **add_kwargs), services=services) as context:
        context.write(BEGIN, Bag(**{'foo': 'bar'}), Bag(**{'foo': 'baz', 'ignore': 'this'}), END)
        context.step()
        context.step()
@ -42,61 +36,24 @@ def test_write_csv_to_file_kwargs(tmpdir, add_kwargs):
        getattr(context, 'file')


-def test_read_csv_from_file_arg0(tmpdir):
-    fs, filename, services = csv_tester.get_services_for_reader(tmpdir)
-
-    with CapturingNodeExecutionContext(
-        CsvReader(path=filename, delimiter=',', ioformat=settings.IOFORMAT_ARG0),
-        services=services,
-    ) as context:
-        context.write(BEGIN, Bag(), END)
-        context.step()
-
-    assert len(context.send.mock_calls) == 2
-
-    args0, kwargs0 = context.send.call_args_list[0]
-    assert len(args0) == 1 and not len(kwargs0)
-    args1, kwargs1 = context.send.call_args_list[1]
-    assert len(args1) == 1 and not len(kwargs1)
-
-    assert args0[0].args[0] == {
-        'a': 'a foo',
-        'b': 'b foo',
-        'c': 'c foo',
-    }
-    assert args1[0].args[0] == {
-        'a': 'a bar',
-        'b': 'b bar',
-        'c': 'c bar',
-    }
-
-
 def test_read_csv_from_file_kwargs(tmpdir):
    fs, filename, services = csv_tester.get_services_for_reader(tmpdir)

-    with CapturingNodeExecutionContext(
+    with BufferingNodeExecutionContext(
        CsvReader(path=filename, delimiter=','),
        services=services,
    ) as context:
        context.write(BEGIN, Bag(), END)
        context.step()
+        output = context.get_buffer()

-    assert len(context.send.mock_calls) == 2
-
-    args0, kwargs0 = context.send.call_args_list[0]
-    assert len(args0) == 1 and not len(kwargs0)
-    args1, kwargs1 = context.send.call_args_list[1]
-    assert len(args1) == 1 and not len(kwargs1)
-
-    _args, _kwargs = args0[0].get()
-    assert not len(_args) and _kwargs == {
+    assert len(output) == 2
+    assert output[0] == {
        'a': 'a foo',
        'b': 'b foo',
        'c': 'c foo',
    }
-
-    _args, _kwargs = args1[0].get()
-    assert not len(_args) and _kwargs == {
+    assert output[1] == {
        'a': 'a bar',
        'b': 'b bar',
        'c': 'c bar',
--- a/tests/io/test_file.py
+++ b/tests/io/test_file.py
@ -3,7 +3,7 @@ import pytest
 from bonobo import Bag, FileReader, FileWriter
 from bonobo.constants import BEGIN, END
 from bonobo.execution.node import NodeExecutionContext
-from bonobo.util.testing import CapturingNodeExecutionContext, FilesystemTester
+from bonobo.util.testing import BufferingNodeExecutionContext, FilesystemTester

 txt_tester = FilesystemTester('txt')
 txt_tester.input_data = 'Hello\nWorld\n'
@ -41,16 +41,10 @@ def test_file_writer_in_context(tmpdir, lines, output):
 def test_file_reader(tmpdir):
    fs, filename, services = txt_tester.get_services_for_reader(tmpdir)

-    with CapturingNodeExecutionContext(FileReader(path=filename), services=services) as context:
-        context.write(BEGIN, Bag(), END)
-        context.step()
+    with BufferingNodeExecutionContext(FileReader(path=filename), services=services) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()

-    assert len(context.send.mock_calls) == 2
-
-    args0, kwargs0 = context.send.call_args_list[0]
-    assert len(args0) == 1 and not len(kwargs0)
-    args1, kwargs1 = context.send.call_args_list[1]
-    assert len(args1) == 1 and not len(kwargs1)
-
-    assert args0[0].args[0] == 'Hello'
-    assert args1[0].args[0] == 'World'
+    assert len(output) == 2
+    assert output[0] == 'Hello'
+    assert output[1] == 'World'
--- a/tests/io/test_json.py
+++ b/tests/io/test_json.py
@ -3,21 +3,20 @@ import pytest
 from bonobo import Bag, JsonReader, JsonWriter, settings
 from bonobo.constants import BEGIN, END
 from bonobo.execution.node import NodeExecutionContext
-from bonobo.util.testing import CapturingNodeExecutionContext, FilesystemTester
+from bonobo.util.testing import FilesystemTester

 json_tester = FilesystemTester('json')
 json_tester.input_data = '''[{"x": "foo"},{"x": "bar"}]'''


-def test_write_json_arg0(tmpdir):
+def test_write_json_ioformat_arg0(tmpdir):
    fs, filename, services = json_tester.get_services_for_writer(tmpdir)

-    with NodeExecutionContext(JsonWriter(filename, ioformat=settings.IOFORMAT_ARG0), services=services) as context:
-        context.write(BEGIN, Bag({'foo': 'bar'}), END)
-        context.step()
+    with pytest.raises(ValueError):
+        JsonWriter(filename, ioformat=settings.IOFORMAT_ARG0)

-    with fs.open(filename) as fp:
-        assert fp.read() == '[{"foo": "bar"}]'
+    with pytest.raises(ValueError):
+        JsonReader(filename, ioformat=settings.IOFORMAT_ARG0),


@pytest.mark.parametrize('add_kwargs', ({}, {
@ -32,24 +31,3 @@ def test_write_json_kwargs(tmpdir, add_kwargs):

    with fs.open(filename) as fp:
        assert fp.read() == '[{"foo": "bar"}]'
-
-
-def test_read_json_arg0(tmpdir):
-    fs, filename, services = json_tester.get_services_for_reader(tmpdir)
-
-    with CapturingNodeExecutionContext(
-        JsonReader(filename, ioformat=settings.IOFORMAT_ARG0),
-        services=services,
-    ) as context:
-        context.write(BEGIN, Bag(), END)
-        context.step()
-
-    assert len(context.send.mock_calls) == 2
-
-    args0, kwargs0 = context.send.call_args_list[0]
-    assert len(args0) == 1 and not len(kwargs0)
-    args1, kwargs1 = context.send.call_args_list[1]
-    assert len(args1) == 1 and not len(kwargs1)
-
-    assert args0[0].args[0] == {'x': 'foo'}
-    assert args1[0].args[0] == {'x': 'bar'}
--- a/tests/io/test_pickle.py
+++ b/tests/io/test_pickle.py
@ -2,10 +2,9 @@ import pickle

 import pytest

-from bonobo import Bag, PickleReader, PickleWriter, settings
-from bonobo.constants import BEGIN, END
+from bonobo import Bag, PickleReader, PickleWriter
 from bonobo.execution.node import NodeExecutionContext
-from bonobo.util.testing import CapturingNodeExecutionContext, FilesystemTester
+from bonobo.util.testing import BufferingNodeExecutionContext, FilesystemTester

 pickle_tester = FilesystemTester('pkl', mode='wb')
 pickle_tester.input_data = pickle.dumps([['a', 'b', 'c'], ['a foo', 'b foo', 'c foo'], ['a bar', 'b bar', 'c bar']])
@ -14,10 +13,8 @@ pickle_tester.input_data = pickle.dumps([['a', 'b', 'c'], ['a foo', 'b foo', 'c
 def test_write_pickled_dict_to_file(tmpdir):
    fs, filename, services = pickle_tester.get_services_for_writer(tmpdir)

-    with NodeExecutionContext(PickleWriter(filename, ioformat=settings.IOFORMAT_ARG0), services=services) as context:
-        context.write(BEGIN, Bag({'foo': 'bar'}), Bag({'foo': 'baz', 'ignore': 'this'}), END)
-        context.step()
-        context.step()
+    with NodeExecutionContext(PickleWriter(filename), services=services) as context:
+        context.write_sync(Bag({'foo': 'bar'}), Bag({'foo': 'baz', 'ignore': 'this'}))

    with fs.open(filename, 'rb') as fp:
        assert pickle.loads(fp.read()) == {'foo': 'bar'}
@ -29,25 +26,17 @@ def test_write_pickled_dict_to_file(tmpdir):
 def test_read_pickled_list_from_file(tmpdir):
    fs, filename, services = pickle_tester.get_services_for_reader(tmpdir)

-    with CapturingNodeExecutionContext(
-        PickleReader(filename, ioformat=settings.IOFORMAT_ARG0), services=services
-    ) as context:
-        context.write(BEGIN, Bag(), END)
-        context.step()
+    with BufferingNodeExecutionContext(PickleReader(filename), services=services) as context:
+        context.write_sync(Bag())
+        output = context.get_buffer()

-    assert len(context.send.mock_calls) == 2
-
-    args0, kwargs0 = context.send.call_args_list[0]
-    assert len(args0) == 1 and not len(kwargs0)
-    args1, kwargs1 = context.send.call_args_list[1]
-    assert len(args1) == 1 and not len(kwargs1)
-
-    assert args0[0].args[0] == {
+    assert len(output) == 2
+    assert output[0] == {
        'a': 'a foo',
        'b': 'b foo',
        'c': 'c foo',
    }
-    assert args1[0].args[0] == {
+    assert output[1] == {
        'a': 'a bar',
        'b': 'b bar',
        'c': 'c bar',
--- a/tests/test_basicusage.py
+++ b/tests/test_basicusage.py
@ -12,4 +12,5 @@ def test_run_graph_noop():

    with patch('bonobo._api._is_interactive_console', side_effect=lambda: False):
        result = bonobo.run(graph)
+
    assert isinstance(result, GraphExecutionContext)
--- a/tests/test_commands.py
+++ b/tests/test_commands.py
@ -30,9 +30,13 @@ def test_entrypoint():
    for command in pkg_resources.iter_entry_points('bonobo.commands'):
        commands[command.name] = command

-    assert 'init' in commands
-    assert 'run' in commands
-    assert 'version' in commands
+    assert not {
+        'convert',
+        'init',
+        'inspect',
+        'run',
+        'version',
+    }.difference(set(commands))


@all_runners
--- a/tests/test_execution.py
+++ b/tests/test_execution.py
@ -51,31 +51,31 @@ def test_simple_execution_context():
    graph = Graph()
    graph.add_chain(*chain)

-    ctx = GraphExecutionContext(graph)
-    assert len(ctx.nodes) == len(chain)
-    assert not len(ctx.plugins)
+    context = GraphExecutionContext(graph)
+    assert len(context.nodes) == len(chain)
+    assert not len(context.plugins)

    for i, node in enumerate(chain):
-        assert ctx[i].wrapped is node
+        assert context[i].wrapped is node

-    assert not ctx.alive
-    assert not ctx.started
-    assert not ctx.stopped
+    assert not context.alive
+    assert not context.started
+    assert not context.stopped

-    ctx.write(BEGIN, Bag(), END)
+    context.write(BEGIN, Bag(), END)

-    assert not ctx.alive
-    assert not ctx.started
-    assert not ctx.stopped
+    assert not context.alive
+    assert not context.started
+    assert not context.stopped

-    ctx.start()
+    context.start()

-    assert ctx.alive
-    assert ctx.started
-    assert not ctx.stopped
+    assert context.alive
+    assert context.started
+    assert not context.stopped

-    ctx.stop()
+    context.stop()

-    assert not ctx.alive
-    assert ctx.started
-    assert ctx.stopped
+    assert not context.alive
+    assert context.started
+    assert context.stopped