Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
SaQC
Manage
Activity
Members
Labels
Plan
Issues
36
Issue boards
Milestones
Wiki
Code
Merge requests
8
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Container Registry
Model registry
Operate
Environments
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
rdm-software
SaQC
Commits
80b82fb1
Commit
80b82fb1
authored
4 years ago
by
Bert Palm
🎇
Browse files
Options
Downloads
Patches
Plain Diff
fixed (generic) isflagged and its test
parent
ae00e0e2
No related branches found
No related tags found
4 merge requests
!271
Static expansion of regular expressions
,
!260
Follow-Up Translations
,
!237
Flagger Translations
,
!232
WIP: Fuzzy testing
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
saqc/funcs/generic.py
+23
-3
23 additions, 3 deletions
saqc/funcs/generic.py
test/funcs/test_generic_config_functions.py
+34
-29
34 additions, 29 deletions
test/funcs/test_generic_config_functions.py
with
57 additions
and
32 deletions
saqc/funcs/generic.py
+
23
−
3
View file @
80b82fb1
...
...
@@ -21,13 +21,33 @@ _OP = {'<': op.lt, '<=': op.le, '==': op.eq, '!=': op.ne, '>': op.gt, '>=': op.g
def
_dslIsFlagged
(
flagger
:
Flagger
,
var
:
pd
.
Series
,
flag
:
float
=
UNFLAGGED
,
comparator
:
str
=
"
>
"
flagger
:
Flagger
,
var
:
pd
.
Series
,
flag
:
float
=
None
,
comparator
:
str
=
None
)
->
Union
[
pd
.
Series
,
DictOfSeries
]:
"""
helper function for `flag`
Param Combinations
------------------
- ``isflagged(
'
var
'
)`` : show me (anything) flagged
- ``isflagged(
'
var
'
, DOUBT)`` : show me ``flags >= DOUBT``
- ``isflagged(
'
var
'
, DOUBT,
'
==
'
)`` : show me ``flags == DOUBT``
Raises
------
ValueError: if `comparator` is passed but no `flag` vaule. Eg. ``isflagged(
'
var
'
, comparator=
'
>=
'
)``
"""
comparison
=
_OP
[
comparator
]
return
comparison
(
flagger
[
var
.
name
],
flag
)
if
flag
is
None
:
if
comparator
is
not
None
:
raise
ValueError
(
'
if `comparator` is used, explicitly pass a `flag` level.
'
)
flag
=
UNFLAGGED
comparator
=
'
>
'
# default
if
comparator
is
None
:
comparator
=
'
>=
'
_op
=
_OP
[
comparator
]
return
_op
(
flagger
[
var
.
name
],
flag
)
def
_execGeneric
(
flagger
:
Flagger
,
data
:
DictOfSeries
,
func
:
Callable
[[
pd
.
Series
],
pd
.
Series
],
field
:
str
,
...
...
This diff is collapsed.
Click to expand it.
test/funcs/test_generic_config_functions.py
+
34
−
29
View file @
80b82fb1
...
...
@@ -2,22 +2,20 @@
# -*- coding: utf-8 -*-
import
ast
import
pytest
import
numpy
as
np
import
pandas
as
pd
from
dios
import
DictOfSeries
from
test.common
import
TESTFLAGGER
,
TESTNODATA
,
initData
,
writeIO
import
dios
from
saqc.common
import
*
from
saqc.flagger
import
Flagger
,
initFlagsLike
from
saqc.core.visitor
import
ConfigFunctionParser
from
saqc.core.config
import
Fields
as
F
from
saqc.core.register
import
register
from
saqc
import
SaQC
from
saqc.funcs.generic
import
_execGeneric
from
saqc
import
SaQC
from
test.common
import
TESTNODATA
,
initData
,
writeIO
@pytest.fixture
...
...
@@ -32,7 +30,7 @@ def data_diff():
col1
=
data
[
data
.
columns
[
1
]]
mid
=
len
(
col0
)
//
2
offset
=
len
(
col0
)
//
8
return
DictOfSeries
(
data
=
{
col0
.
name
:
col0
.
iloc
[:
mid
+
offset
],
col1
.
name
:
col1
.
iloc
[
mid
-
offset
:],})
return
dios
.
DictOfSeries
(
data
=
{
col0
.
name
:
col0
.
iloc
[:
mid
+
offset
],
col1
.
name
:
col1
.
iloc
[
mid
-
offset
:],})
def
_compileGeneric
(
expr
,
flagger
):
...
...
@@ -41,8 +39,8 @@ def _compileGeneric(expr, flagger):
return
kwargs
[
"
func
"
]
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
def
test_missingIdentifier
(
data
,
f
lagger
)
:
def
test_missingIdentifier
(
data
):
flagger
=
F
lagger
(
)
# NOTE:
# - the error is only raised at runtime during parsing would be better
...
...
@@ -57,9 +55,8 @@ def test_missingIdentifier(data, flagger):
_execGeneric
(
flagger
,
data
,
func
,
field
=
""
,
nodata
=
np
.
nan
)
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
def
test_syntaxError
(
flagger
):
def
test_syntaxError
():
flagger
=
Flagger
()
tests
=
[
"
range(x=5
"
,
"
rangex=5)
"
,
...
...
@@ -106,8 +103,7 @@ def test_comparisonOperators(data):
assert
np
.
all
(
result
==
expected
)
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
def
test_arithmeticOperators
(
data
,
flagger
):
def
test_arithmeticOperators
(
data
):
flagger
=
initFlagsLike
(
data
)
var1
,
*
_
=
data
.
columns
this
=
data
[
var1
]
...
...
@@ -127,8 +123,7 @@ def test_arithmeticOperators(data, flagger):
assert
np
.
all
(
result
==
expected
)
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
def
test_nonReduncingBuiltins
(
data
,
flagger
):
def
test_nonReduncingBuiltins
(
data
):
flagger
=
initFlagsLike
(
data
)
var1
,
*
_
=
data
.
columns
this
=
var1
...
...
@@ -147,10 +142,8 @@ def test_nonReduncingBuiltins(data, flagger):
assert
(
result
==
expected
).
all
()
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
@pytest.mark.parametrize
(
"
nodata
"
,
TESTNODATA
)
def
test_reduncingBuiltins
(
data
,
flagger
,
nodata
):
def
test_reduncingBuiltins
(
data
,
nodata
):
data
.
loc
[::
4
]
=
nodata
flagger
=
initFlagsLike
(
data
)
var1
=
data
.
columns
[
0
]
...
...
@@ -171,10 +164,10 @@ def test_reduncingBuiltins(data, flagger, nodata):
assert
result
==
expected
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
@pytest.mark.parametrize
(
"
nodata
"
,
TESTNODATA
)
def
test_ismissing
(
data
,
flagger
,
nodata
):
def
test_ismissing
(
data
,
nodata
):
flagger
=
initFlagsLike
(
data
)
data
.
iloc
[:
len
(
data
)
//
2
,
0
]
=
np
.
nan
data
.
iloc
[(
len
(
data
)
//
2
)
+
1
:,
0
]
=
-
9999
this
=
data
.
iloc
[:,
0
]
...
...
@@ -190,9 +183,8 @@ def test_ismissing(data, flagger, nodata):
assert
np
.
all
(
result
==
expected
)
@pytest.mark.parametrize
(
"
flagger
"
,
TESTFLAGGER
)
@pytest.mark.parametrize
(
"
nodata
"
,
TESTNODATA
)
def
test_bitOps
(
data
,
flagger
,
nodata
):
def
test_bitOps
(
data
,
nodata
):
var1
,
var2
,
*
_
=
data
.
columns
this
=
var1
...
...
@@ -220,14 +212,26 @@ def test_isflagged(data):
(
f
"
isflagged(
{
var1
}
)
"
,
flagger
[
var1
]
>
UNFLAGGED
),
(
f
"
isflagged(
{
var1
}
, flag=BAD)
"
,
flagger
[
var1
]
>=
BAD
),
(
f
"
isflagged(
{
var1
}
, UNFLAGGED,
'
==
'
)
"
,
flagger
[
var1
]
==
UNFLAGGED
),
(
f
"
~isflagged(
{
var2
}
)
"
,
~
(
flagger
[
var2
]
>
UNFLAGGED
)
)
,
(
f
"
~(
{
var2
}
>999) & (~isflagged(
{
var2
}
))
"
,
~
(
data
[
var2
]
>
999
)
&
~
(
flagger
[
var2
]
>
UNFLAGGED
)),
(
f
"
~isflagged(
{
var2
}
)
"
,
flagger
[
var2
]
==
UNFLAGGED
),
(
f
"
~(
{
var2
}
>999) & (~isflagged(
{
var2
}
))
"
,
~
(
data
[
var2
]
>
999
)
&
(
flagger
[
var2
]
==
UNFLAGGED
)),
]
for
test
,
expected
in
tests
:
func
=
_compileGeneric
(
f
"
generic.flag(func=
{
test
}
, flag=BAD)
"
,
flagger
)
result
=
_execGeneric
(
flagger
,
data
,
func
,
field
=
None
,
nodata
=
np
.
nan
)
assert
np
.
all
(
result
==
expected
)
for
i
,
(
test
,
expected
)
in
enumerate
(
tests
):
try
:
func
=
_compileGeneric
(
f
"
generic.flag(func=
{
test
}
, flag=BAD)
"
,
flagger
)
result
=
_execGeneric
(
flagger
,
data
,
func
,
field
=
None
,
nodata
=
np
.
nan
)
assert
np
.
all
(
result
==
expected
)
except
Exception
:
print
(
i
,
test
)
raise
# test bad combination
for
comp
in
[
'
>
'
,
'
>=
'
,
'
==
'
,
'
!=
'
,
'
<
'
,
'
<=
'
]:
fails
=
f
"
isflagged(
{
var1
}
, comparator=
'
{
comp
}
'
)
"
func
=
_compileGeneric
(
f
"
generic.flag(func=
{
fails
}
, flag=BAD)
"
,
flagger
)
with
pytest
.
raises
(
ValueError
):
_execGeneric
(
flagger
,
data
,
func
,
field
=
None
,
nodata
=
np
.
nan
)
def
test_variableAssignments
(
data
):
...
...
@@ -249,6 +253,7 @@ def test_variableAssignments(data):
assert
set
(
result_flagger
.
columns
)
==
set
(
data
.
columns
)
|
{
"
dummy1
"
,
"
dummy2
"
}
# TODO: why this must(!) fail ? - a comment would be helpful
@pytest.mark.xfail
(
strict
=
True
)
def
test_processMultiple
(
data_diff
):
var1
,
var2
,
*
_
=
data_diff
.
columns
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment