Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[frozen] pyDKB.dataflow.stage tests #196

Open
wants to merge 28 commits into
base: pyDKB
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 17 commits
Commits
Show all changes
28 commits
Select commit Hold shift + click to select a range
4c1c44a
Added command line arguments tests.
Evildoor Nov 16, 2018
e1343c5
Updated a check_args method.
Evildoor Nov 19, 2018
1022253
Reworked mode tests.
Evildoor Nov 19, 2018
088e180
Added testing for arguments' interactions.
Evildoor Nov 19, 2018
339c3ca
Improved check_args method.
Evildoor Nov 20, 2018
1a56cd0
Removed unnecesary redefinition.
Evildoor Nov 20, 2018
dcbdeab
Reworked modes handling.
Evildoor Nov 20, 2018
3eaa413
Added long versions for eop and eom testing.
Evildoor Nov 20, 2018
1565684
Improved consistency: short version before long.
Evildoor Nov 20, 2018
be922c9
Added input files test.
Evildoor Nov 20, 2018
aa90f7c
Removed short version of override tests.
Evildoor Nov 20, 2018
cf56b0c
Moved override_hdfs_mode definition into a loop.
Evildoor Nov 20, 2018
8a37c7d
Improved readability in testing hdfs overrides.
Evildoor Nov 21, 2018
324978c
Moved repeating args definition into setUp().
Evildoor Nov 23, 2018
fdb498a
Added tests for config argument.
Evildoor Dec 14, 2018
42877e2
Improved config tests.
Evildoor Dec 17, 2018
9dc9aa0
Added 'incorrect' tests for mode, source and dest.
Evildoor Dec 18, 2018
19ca409
Improved the functions with 'short' argument.
Evildoor Dec 20, 2018
c3e4810
Updated tests for correct config.
Evildoor Jan 23, 2019
c81a096
Merge remote-tracking branch 'origin/pyDKB' into pyDKB-tests
Evildoor Apr 24, 2019
f795e24
Adapt tests to pyDKB changes.
Evildoor Apr 26, 2019
77ef71b
Add empty EOM tests.
Evildoor Apr 29, 2019
1d4feb2
Change value used to trigger an error.
Evildoor Apr 29, 2019
b5d6842
Rename a variable to improve readability.
Evildoor Apr 29, 2019
38a383e
Add raw strings processing test.
Evildoor Apr 29, 2019
c99f4c6
Replace repeating assignments with dict.update().
Evildoor Apr 29, 2019
e1df893
Add missing return value description.
Evildoor Apr 29, 2019
7dad261
Divide test_ProcessorStage.py per how-to: tests.
Evildoor Apr 30, 2019
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Empty file.
325 changes: 325 additions & 0 deletions Utils/Dataflow/pyDKB/dataflow/stage/tests/test_ProcessorStage.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,325 @@
#!/usr/bin/env python

"""
Tests for pyDKB.dataflow.stage.ProcessorStage.
Usage: 'python -m unittest discover' from ..
(directory with pyDKB.dataflow.stage code).
"""


import cStringIO
import os
import sys
import tempfile
import unittest


# Relative import inside of pyDKB prevents the use of simple 'import pyDKB'.
try:
base_dir = os.path.dirname(__file__) # Directory with this file
dkb_dir = os.path.join(base_dir, os.pardir) # stage directory
dkb_dir = os.path.join(dkb_dir, os.pardir) # dataflow directory
dkb_dir = os.path.join(dkb_dir, os.pardir) # pyDKB's directory
dkb_dir = os.path.join(dkb_dir, os.pardir) # pyDKB's parent directory
sys.path.append(dkb_dir)
import pyDKB
except Exception, err:
sys.stderr.write("(ERROR) Failed to import pyDKB library: %s\n" % err)
sys.exit(1)


def isolate_function_error(f, *args):
""" Silence and retrieve the function's error message.

The function is expected to throw a SystemExit when run with
specific arguments. Error stream is redirected into a string during the
function's execution, and the resulting messages can be analyzed.

:param f: function to execute
:type f: function
:param args: arguments to execute function with
:type args: list

:return:
:rtype:
"""
buf = cStringIO.StringIO()
temp_err = sys.stderr
sys.stderr = buf
try:
result = f(*args)
except SystemExit:
result = None
sys.stderr = temp_err
buf.seek(0)
msg = buf.read()
buf.close()
return [msg, result]


args_to_add = {
'source': ['f', 's', 'h'],
'dest': ['f', 's', 'h'],
}


modes = {
's': {'mode': 's', 'source': 's', 'dest': 's', 'eom': '\n', 'eop': '\0'},
'f': {'mode': 'f', 'source': 'f', 'dest': 'f', 'eom': '\n', 'eop': ''},
'm': {'mode': 'm', 'source': 's', 'dest': 's', 'eom': '\n', 'eop': ''},
}


class ProcessorStageArgsTestCase(unittest.TestCase):
default_args = {
'mode': 'f',
'config': None,
'eom': '\n',
'eop': '',
'source': 'f',
'dest': 'f',
'input_dir': os.curdir,
'output_dir': 'out',
'hdfs': False,
'input_files': []
}

def setUp(self):
self.stage = pyDKB.dataflow.stage.ProcessorStage()
self.args = dict(self.default_args)
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Maybe name it expected_args (or exp_args)? Longer, right, but more readable... it`s just now it makes me remid myself every now and then how it is used.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.


def tearDown(self):
self.stage = None
self.args = None

def check_args(self):
for a in self.args:
# Such kind of testing does not display the argument's name,
# hence the {a: ...} addition.
self.assertEqual({a: getattr(self.stage.ARGS, a)},
{a: self.args[a]})

def test_default(self):
self.stage.parse_args('')
self.check_args()

def test_hdfs(self):
self.stage.parse_args(['--hdfs'])
self.args['hdfs'] = True
self.args['source'] = 'h'
self.args['dest'] = 'h'
self.check_args()

def test_e(self):
self.stage.parse_args(['-e', '\t'])
self.args['eom'] = '\t'
self.check_args()

def test_end_of_message(self):
self.stage.parse_args(['--end-of-message', '\t'])
self.args['eom'] = '\t'
self.check_args()

def test_E(self):
self.stage.parse_args(['-E', '\t'])
self.args['eop'] = '\t'
self.check_args()

def test_end_of_process(self):
self.stage.parse_args(['--end-of-process', '\t'])
self.args['eop'] = '\t'
self.check_args()

def test_i(self):
self.stage.parse_args(['-i', 'something'])
self.args['input_dir'] = 'something'
self.check_args()

def test_input_dir(self):
self.stage.parse_args(['--input-dir', 'something'])
self.args['input_dir'] = 'something'
self.check_args()

def test_o(self):
self.stage.parse_args(['-o', 'something'])
self.args['output_dir'] = 'something'
self.check_args()

def test_output_dir(self):
self.stage.parse_args(['--output-dir', 'something'])
self.args['output_dir'] = 'something'
self.check_args()

def test_input_files(self):
self.stage.parse_args(['something', 'something_else'])
self.args['input_files'] = ['something', 'something_else']
self.check_args()


def add_arg(arg, val, short=False):
def f(self):
if short:
self.stage.parse_args(['-' + arg[0], val])
else:
self.stage.parse_args(['--' + arg, val])
self.args[arg] = val
self.check_args()
if short:
setattr(ProcessorStageArgsTestCase, 'test_%s_%s' % (arg[0], val), f)
else:
setattr(ProcessorStageArgsTestCase, 'test_%s_%s' % (arg, val), f)


def add_arg_incorrect(arg, short=False):
if short:
val = 'i'
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Maybe it would be better to use here 'incorrect' as value instead of 'i'?
I have mentioned it earlier, but the comment was buried after push --force :) -- values for the parameters being tested are more likely to be one-char length, so using the longer word we are almost guaranteed from hitting a new valid value by chance.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Done.

args = ['-' + arg[0], val]
fname = 'test_%s_%s' % (arg[0], val)
else:
val = 'incorrect'
args = ['--' + arg, val]
fname = 'test_%s_%s' % (arg, val)

def f(self):
[msg, result] = isolate_function_error(self.stage.parse_args, args)
err = "error: argument -%s/--%s: invalid choice: '%s'" % (arg[0],
arg, val)
self.assertIn(err, msg)
setattr(ProcessorStageArgsTestCase, fname, f)


def add_mode(val, short=False):
def f(self):
if short:
self.stage.parse_args(['-m', val])
else:
self.stage.parse_args(['--mode', val])
self.args.update(modes[val])
self.check_args()
if short:
setattr(ProcessorStageArgsTestCase, 'test_m_%s' % (val), f)
else:
setattr(ProcessorStageArgsTestCase, 'test_mode_%s' % (val), f)


# hdfs >> source-dest >> mode
def add_override_hdfs(arg, val):
def f(self):
self.stage.parse_args(['--hdfs', '--' + arg, val])
self.args[arg] = val
self.args['hdfs'] = True
self.args['source'] = 'h'
self.args['dest'] = 'h'
self.check_args()
setattr(ProcessorStageArgsTestCase,
'test_override_hdfs_%s_%s' % (arg, val), f)


def add_override_mode(arg, val, mode_val):
def f(self):
self.stage.parse_args(['--' + arg, val, '--mode', mode_val])
self.args.update(modes[mode_val])
self.args[arg] = val
self.check_args()
setattr(ProcessorStageArgsTestCase,
'test_override_%s_%s_mode_%s' % (arg, val, mode_val), f)


def add_override_hdfs_mode(val):
def f(self):
self.stage.parse_args(['--hdfs', '--mode', val])
self.args.update(modes[val])
self.args['hdfs'] = True
self.args['source'] = 'h'
self.args['dest'] = 'h'
self.check_args()
setattr(ProcessorStageArgsTestCase,
'test_override_hdfs_mode_%s' % (val), f)


for a in args_to_add:
for v in args_to_add[a]:
add_arg(a, v, True)
add_arg(a, v)
add_override_hdfs(a, v)
for m in modes:
add_override_mode(a, v, m)
add_arg_incorrect(a, True)
add_arg_incorrect(a)


for m in modes:
add_mode(m, True)
add_mode(m)
add_override_hdfs_mode(m)


add_arg_incorrect('mode', True)
add_arg_incorrect('mode')


class ProcessorStageConfigArgTestCase(unittest.TestCase):
def setUp(self):
self.stage = pyDKB.dataflow.stage.ProcessorStage()
self.fake_config = tempfile.NamedTemporaryFile(dir='.')

def tearDown(self):
self.stage = None
if not self.fake_config.closed:
self.fake_config.close()
self.fake_config = None

def test_correct_c(self):
self.stage.parse_args(['-c', self.fake_config.name])
self.assertIsNotNone(getattr(self.stage.ARGS, 'config'))

def test_correct_config(self):
self.stage.parse_args(['--config', self.fake_config.name])
self.assertIsNotNone(getattr(self.stage.ARGS, 'config'))

def test_missing_c(self):
self.fake_config.close()
[msg, result] = isolate_function_error(self.stage.parse_args,
['-c', self.fake_config.name])
err = "[Errno 2] No such file or directory: '%s'" %\
self.fake_config.name
self.assertIn(err, msg)

def test_missing_config(self):
self.fake_config.close()
[msg, result] = isolate_function_error(self.stage.parse_args,
['--config',
self.fake_config.name])
err = "[Errno 2] No such file or directory: '%s'" %\
self.fake_config.name
self.assertIn(err, msg)

def test_unreadable_c(self):
os.chmod(self.fake_config.name, 0300)
[msg, result] = isolate_function_error(self.stage.parse_args,
['-c', self.fake_config.name])
err = "[Errno 13] Permission denied: '%s'" %\
self.fake_config.name
self.assertIn(err, msg)

def test_unreadable_config(self):
os.chmod(self.fake_config.name, 0300)
[msg, result] = isolate_function_error(self.stage.parse_args,
['--config',
self.fake_config.name])
err = "[Errno 13] Permission denied: '%s'" %\
self.fake_config.name
self.assertIn(err, msg)


test_cases = (
ProcessorStageArgsTestCase,
ProcessorStageConfigArgTestCase,
)


def load_tests(loader, tests, pattern):
suite = unittest.TestSuite()
for case in test_cases:
suite.addTest(loader.loadTestsFromTestCase(case))
return suite