add initial tests and project boilerplate

json2d · json2d · commit 0a388ce00bce · 2020-03-03T19:01:51.000-05:00
+ docker containers for running tests
diff --git a/.gitignore b/.gitignore
@@ -1,3 +1,5 @@
+.vscode
+
 # Byte-compiled / optimized / DLL files
 __pycache__/
 *.py[cod]
diff --git a/README.md b/README.md
@@ -8,41 +8,53 @@ import validframe as vf
 
 df = pd.DataFrame([
   ['a','b'], # headers
-  [1,2], # row 1
-  [1, None] # row 2
-  [1, 'hello'] # row 3
-  [1, 3.14] # row 4
+  [1, 1], # row 0
+  [1, None], # row 1
+  [1, 'hello'], # row 2
+  [1, 3.14], # row 3
 ])
 
-err_msg = "you wont see this error"
-err_msg = "you wont see this error"
+vf.validator(lambda x: x == 1, col='a')(df)
 
-assert vf.not_negative()(df), "you wont see this error"
-assert vf.not_empty()(df), "you will see this error"
+# validate that all cells that are numbers are also positive
+vf.validator(lambda x: x>0, filter=lambda x: isinstance(x, Number) )(df)
 
-assert vf.not_empty(row=0)(df), "you wont see this error"
-assert vf.not_empty(row=1)(df), "you will see this error"
-assert vf.not_empty(col='a')(df), "you wont see this error"
-assert vf.not_empty(col='b')(df), "you will see this error"
 
-assert vf.totals(4, col='a')(df), "you won't see this error"
-assert vf.min(0, col='a')(df), "you won't see this error"
-assert vf.max(2, col='a')(df), "you won't see this error"
+vf.positive()(df) # AssertionError
+vf.not_empty()(df) # AssertionError
+vf.empty()(df) # AssertionError
 
-assert vf.ints(col='a')(df), "you won't see this error"
-assert vf.ints(col='b')(df), "you will see this error"
+vf.not_empty(row=0)(df)
+vf.not_empty(row=1)(df) # AssertionError
+vf.not_empty(col='a')(df)
+vf.not_empty(col='b')(df) # AssertionError
 
-assert vf.strs(col='b', row=3)(df), "you won't see this error"
-assert vf.floats(col='b', row=4)(df), "you won't see this error"
+vf.empty(col='b', row=1)(df)
+vf.empty(col='b')(df) # AssertionError
 
-assert vf.validate(lambda x: x.isnumeric, col='a')(df), "you won't see this error"
+vf.min(0, col='a')(df)
+vf.max(2, col='a')(df)
+
+vf.ints(col='a')(df)
+vf.ints(row=0)(df)
+vf.ints(col='b')(df) # AssertionError
+
+vf.strs(col='b', row=2)(df)
+vf.floats(col='b', row=3)(df)
+
+vf.totals(4, col='a')(df)
 
-# validate that all cells that are numbers are positive
-assert vf.validate(lambda x: x>0, filter=lambda x: x.isnumeric() )(df), "you won't see this error"
 ```
 
 ### boycotting lambdas? 
 use functions instead
-```
-def 
+```py
+def is_cell_foo(x):
+  foo = (None, str, int, float)
+  return isinstance(x, foo)
+
+validate_is_cells_foo = vf.validator(is_cell_foo)
+
+validate_is_cells_foo(df)
 
+```
diff --git a/docker-compose.shell.yml b/docker-compose.shell.yml
@@ -0,0 +1,11 @@
+version: '3'
+services:
+  test-runner:
+    build: 
+      context: .
+      dockerfile: python3.Dockerfile
+    command: python
+    volumes:
+     - .:/app
+    stdin_open: true
+    tty: true
diff --git a/docker-compose.test-runner.yml b/docker-compose.test-runner.yml
@@ -0,0 +1,20 @@
+version: '3'
+services:
+  test-runner:
+    build: 
+      context: .
+      dockerfile: python3.Dockerfile
+    command: python tests/units.py
+    volumes:
+     - .:/app
+    stdin_open: true
+    tty: true
+  test-runner-2:
+    build: 
+      context: .
+      dockerfile: python2.Dockerfile
+    command: python tests/units.py
+    volumes:
+      - .:/app
+    stdin_open: true
+    tty: true
diff --git a/python2.Dockerfile b/python2.Dockerfile
@@ -0,0 +1,6 @@
+FROM python:2.7
+
+WORKDIR /app
+
+COPY requirements.txt ./
+RUN pip install --no-cache-dir -r requirements.txt
diff --git a/python3.Dockerfile b/python3.Dockerfile
@@ -0,0 +1,6 @@
+FROM python:3.8
+
+WORKDIR /app
+
+COPY requirements.txt ./
+RUN pip install --no-cache-dir -r requirements.txt
diff --git a/requirements.txt b/requirements.txt
@@ -0,0 +1 @@
+# pandas 1.0 dropped Python 2 support; 0.24.x is the last series that installs on 2.7
+pandas==1.0.1; python_version >= "3.6"
+pandas==0.24.2; python_version < "3"
diff --git a/tests/units.py b/tests/units.py
@@ -0,0 +1,190 @@
+import sys
+from os import path
+sys.path.append( path.dirname( path.dirname( path.abspath(__file__) ) ) )
+
+from datetime import timedelta, datetime
+
+from numbers import Number
+
+# from helpers import *
+
+# from functools import reduce
+
+import unittest
+
+import pandas as pd
+
+import validframe as vf
+
+class TestEverything(unittest.TestCase):
+  """Checks validframe validators against small hand-built DataFrames.
+
+  Every test builds a frame, then runs one list of validators that are
+  expected to accept it and one list that is expected to raise
+  AssertionError.
+  """
+
+  # use `_test` prefix instead of `test` (w/o leading underscore) so test runner doesn't use it
+  def _test_should_fail(self, fail_validators, df):
+    """Assert that each validator in `fail_validators` raises AssertionError on `df`."""
+    for validate in fail_validators:
+      with self.assertRaises(AssertionError):
+        validate(df)
+
+  def _test_should_pass(self, pass_validators, df):
+    """Fail the test if any validator in `pass_validators` raises on `df`."""
+    try:
+      for validate in pass_validators:
+        validate(df)
+    except Exception as exc:
+      # `Exception` (not a bare except) so KeyboardInterrupt/SystemExit still propagate
+      self.fail('validation should have passed but exception was raised: {!r}'.format(exc))
+
+  def test_base(self):
+    """Generic `vf.validator` combined with `col`, `row` and `filter` arguments."""
+
+    df = pd.DataFrame(
+      columns = ['a','b'],
+      data = [
+        [1, -42], # row 0
+        [1, None], # row 1
+        [1, None], # row 2
+        [1, 3.14], # row 3
+      ])
+
+    class Mystery():
+      pass
+
+    pass_validators = [
+      vf.validator(lambda x: not isinstance(x, Mystery)),
+      vf.validator(lambda x: x is None or x >= -42),
+      vf.validator(lambda x: x == 1, col='a'),
+      # rows 0 and 3 span both columns, so the predicate has to accept the 'b' values too
+      vf.validator(lambda x: x in (1, -42, 3.14), row=[0, 3]),
+
+      vf.validator(lambda x: x == -42 or x == 3.14, col='b', row=[0, 3]),
+      vf.validator(lambda x: x == 1, col=['a'], row=[0, 3]),
+
+      vf.validator(lambda x: x == 1 or x == -42, filter=lambda x: isinstance(x, int)),
+      vf.validator(lambda x: x is None, filter=lambda x: not isinstance(x, Number)),
+
+      vf.validator(lambda x: x == -42, col='b', filter=lambda x: isinstance(x, int)),
+      vf.validator(lambda x: x == -42, col='b', row=[0,1,2], filter=lambda x: isinstance(x, int))
+    ]
+
+    self._test_should_pass(pass_validators, df)
+
+    fail_validators = [
+      vf.validator(lambda x: isinstance(x, Number)), # all cells are numbers
+      vf.validator(lambda x: isinstance(x, Number), col='b'), # all cells in col 'b' are numbers
+      vf.validator(lambda x: isinstance(x, Number), col=['b']), # all cells in col 'b' are numbers
+
+      vf.validator(lambda x: x < 0, row=0), # all cells in row 0 are negative (and numbers)
+      vf.validator(lambda x: x < 0, row=[0, 3]), # all cells in row 0 and 3 are negative (and numbers)
+      vf.validator(lambda x: x < 0, col='b', row=[0, 3]),
+      vf.validator(lambda x: x < 0, col=['a'], row=[0, 3]),
+
+      vf.validator(lambda x: x < 0, filter=lambda x: isinstance(x, Number)),
+      # row labels are 0-based; the frame has no row 4
+      vf.validator(lambda x: x < 0, col=['b'], row=[3,2,0], filter=lambda x: isinstance(x, float))
+    ]
+
+    self._test_should_fail(fail_validators, df)
+
+
+  def test_mappers(self):
+    """Per-cell convenience validators (positive, empty, min/max, type checks)."""
+
+    # the header names go in `columns` only; repeating them as a data row
+    # would shift every row index below and put strings in numeric columns
+    df = pd.DataFrame(
+      columns = ['a', 'b', 'c'], # headers
+      data = [
+        [1, -42, 'hello'], # row 0
+        [1, None, 'world'], # row 1
+        [1, None, 'ciao'], # row 2
+        [1, 3.14, 'mondo'], # row 3
+      ])
+
+    pass_validators = [
+      vf.positive(col='a'),
+      vf.negative(col='b', row=0),
+      vf.empty(col='b', row=[1,2]),
+      vf.not_empty(col=['a','c'], row=[0,3]),
+      vf.min(0, col=['a','b'], row=3),
+      vf.max(3.14, col=['a','b'], row=3),
+      vf.minmax(-42, 3.14, filter=lambda x : isinstance(x, Number)),
+      vf.ints(col='a'),
+      vf.floats(col='b', row=3),
+      vf.strs(col='c'),
+    ]
+
+    self._test_should_pass(pass_validators, df)
+
+
+    fail_validators = [
+      vf.positive(col='b', row=0),
+      vf.negative(col='a'),
+      vf.empty(col=['a','c'], row=[0,3]),
+      vf.not_empty(col='b', row=[1,2]),
+      vf.min(3.14, col=['a','b'], row=3),
+      vf.max(0, col=['a','b'], row=3),
+      vf.minmax(0, 2, filter=lambda x : isinstance(x, Number)),
+      vf.ints(col='b'),
+      vf.floats(col='a'),
+      vf.strs(row=3),
+    ]
+
+
+    self._test_should_fail(fail_validators, df)
+
+  def test_reducers(self):
+    """`vf.totals` over column, row and filter selections."""
+
+    df = pd.DataFrame(
+      columns = ['a', 'b', 'c'], # headers
+      data = [
+        [1, -42, 'hello'], # row 0
+        [1, None, 'world'], # row 1
+        [1, None, 'ciao'], # row 2
+        [1, 3.14, 'mondo'] # row 3
+      ])
+
+
+    pass_validators = [
+      vf.totals(4, col='a'),
+      vf.totals(-41, col=['a','b'], row=0),
+      vf.totals(-36.86, col=['a','b'], row=[0,3]), # 1 + -42 + 1 + 3.14
+      vf.totals(-38, filter=lambda x : isinstance(x, int)),
+      vf.totals(7.14, filter=lambda x : isinstance(x, Number) and x > 0),
+    ]
+
+    self._test_should_pass(pass_validators, df)
+
+
+    fail_validators = [
+      vf.totals(100, col='a'),
+      vf.totals(1, row=1), # theres a None in this row
+      vf.totals('gg', col='c'),
+    ]
+
+    self._test_should_fail(fail_validators, df)
+
+
+  def test_with_datetime(self):
+    """`vf.min`, `vf.max` and `vf.minmax` on a datetime column."""
+
+    some_day = datetime(2020, 1, 6)
+
+    df = pd.DataFrame(
+      columns = ['net_amount', 'product_name', 'trn_date'], # headers
+      data = [
+        [5.50, 'canoli', some_day], # row 0
+        [9.50, 'tiramisu', some_day + timedelta(hours=1)], # row 1
+        [10, 'salad', some_day + timedelta(hours=2)], # row 2
+        [10, 'bread', some_day + timedelta(days=1)], # row 3
+      ])
+
+    pass_validators = [
+      vf.minmax(some_day, some_day + timedelta(days=1), col='trn_date'),
+      vf.min(some_day, col='trn_date'),
+      vf.max(some_day + timedelta(days=2), col='trn_date'),
+    ]
+
+    self._test_should_pass(pass_validators, df)
+
+
+    fail_validators = [
+      vf.minmax(some_day - timedelta(days=1), some_day, col='trn_date'),
+      vf.min(some_day + timedelta(hours=2), col='trn_date'),
+      vf.max(some_day + timedelta(hours=2), col='trn_date'),
+    ]
+
+    self._test_should_fail(fail_validators, df)
+
+# only run the suite when executed as a script (`python tests/units.py`), not on import
+if __name__ == '__main__':
+  unittest.main()
diff --git a/validframe/__init__.py b/validframe/__init__.py
@@ -0,0 +1 @@
+from .core import *
diff --git a/validframe/core.py b/validframe/core.py
@@ -0,0 +1,15 @@
+def validator(validate_cell, col=None, row=None, filter=None):
+  """Build a DataFrame validator from a per-cell predicate.
+
+  validate_cell -- callable taking a single cell value
+  col, row, filter -- accepted but not used yet; presumably they will
+    narrow which cells get checked (TODO confirm once implemented)
+
+  Returns a function `validate_df(df, **kwargs)`, which currently always
+  raises NotImplementedError.
+
+  Raises AssertionError if `validate_cell` is not callable.
+  """
+
+  # explicit raise instead of an `assert` statement so the check still runs under `python -O`
+  if not callable(validate_cell):
+    raise AssertionError('validate_cell arg must be callable')
+
+  def validate_df(df, **kwargs):
+    # assert any(df.applymap( ... )
+    # NOTE(review): the sketch above uses `any`; `all` looks like the intent — confirm
+    raise NotImplementedError
+
+  return validate_df
+
+def positive(**kwargs):
+  """Return a validator built from the predicate `x > 0`.
+
+  All keyword arguments are passed straight through to `validator`.
+  """
+  def is_positive(cell):
+    return cell > 0
+
+  return validator(is_positive, **kwargs)
+
+def negative(**kwargs):
+  """Return a validator built from the predicate `x < 0`.
+
+  All keyword arguments are passed straight through to `validator`.
+  """
+  return validator(lambda x: x < 0, **kwargs)

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,5 @@`
	`1`	`+.vscode`
	`2`	`+`
`1`	`3`	`# Byte-compiled / optimized / DLL files`
`2`	`4`	`__pycache__/`
`3`	`5`	`*.py[cod]`