Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
SaQC
Manage
Activity
Members
Labels
Plan
Issues
36
Issue boards
Milestones
Wiki
Code
Merge requests
8
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Container Registry
Model registry
Operate
Environments
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
rdm-software
SaQC
Commits
2b7996b2
Commit
2b7996b2
authored
5 years ago
by
David Schäfer
Browse files
Options
Downloads
Plain Diff
Merge branch 'master' of
https://git.ufz.de/rdm/saqc
parents
7dd0a099
0cceb862
No related branches found
Branches containing commit
No related tags found
Tags containing commit
No related merge requests found
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
flagger/dmpflagger.py
+18
-2
18 additions, 2 deletions
flagger/dmpflagger.py
funcs/functions.py
+37
-8
37 additions, 8 deletions
funcs/functions.py
with
55 additions
and
10 deletions
flagger/dmpflagger.py
+
18
−
2
View file @
2b7996b2
#! /usr/bin/env python
# -*- coding: utf-8 -*-
import
subprocess
import
pandas
as
pd
from
.baseflagger
import
BaseFlagger
class
Keywords
:
VERSION
=
"
$version
"
class
FlagFields
:
FLAG
=
"
quality_flag
"
CAUSE
=
"
quality_cause
"
...
...
@@ -24,6 +29,8 @@ class DmpFlagger(BaseFlagger):
def __init__(self):
    """Set up the flagger and record the version of the running project.

    The base flagger is initialised with ``FLAGS``. ``flag_fields`` names the
    three columns that are written together whenever a flag is set (flag,
    cause, comment). ``project_version`` holds the output of
    ``git describe --tags --always --dirty`` and is the text substituted for
    the ``Keywords.VERSION`` placeholder in flag comments.

    If the version cannot be determined (git is not installed, or the
    package does not live inside a git checkout), ``project_version`` falls
    back to ``"unknown"`` so the flagger can still be constructed.
    """
    # Function-scope import: keeps this block self-contained without
    # touching the file's import section.
    import os

    super().__init__(FLAGS)
    self.flag_fields = [FlagFields.FLAG, FlagFields.CAUSE, FlagFields.COMMENT]

    # Describe the repository that contains this package, not whatever
    # directory the calling process happens to be started from.
    package_dir = os.path.dirname(os.path.abspath(__file__))
    try:
        version = subprocess.check_output(
            ["git", "describe", "--tags", "--always", "--dirty"],
            cwd=package_dir,
            stderr=subprocess.DEVNULL,
        )
    except (OSError, subprocess.CalledProcessError):
        # OSError covers a missing git executable; CalledProcessError covers
        # a non-zero exit, e.g. "not a git repository".
        self.project_version = "unknown"
    else:
        self.project_version = version.decode().strip()
def
initFlags
(
self
,
data
,
**
kwargs
):
columns
=
data
.
columns
if
isinstance
(
data
,
pd
.
DataFrame
)
else
[
data
.
name
]
...
...
@@ -48,6 +55,9 @@ class DmpFlagger(BaseFlagger):
else
:
self
.
_checkFlag
(
flag
)
if
Keywords
.
VERSION
in
comment
:
comment
=
comment
.
replace
(
Keywords
.
VERSION
,
self
.
project_version
)
flags
=
self
.
_reduceColumns
(
flags
)
mask
=
flags
[
FlagFields
.
FLAG
]
<
flag
flags
.
loc
[
mask
,
self
.
flag_fields
]
=
flag
,
cause
,
comment
...
...
@@ -60,7 +70,13 @@ class DmpFlagger(BaseFlagger):
return
super
().
isFlagged
(
flagcol
,
flag
)
def
_reduceColumns
(
self
,
flags
):
flags
=
flags
.
copy
()
if
isinstance
(
flags
.
columns
,
pd
.
MultiIndex
):
if
set
(
flags
.
columns
)
==
set
(
self
.
flag_fields
):
pass
elif
isinstance
(
flags
,
pd
.
DataFrame
)
\
and
isinstance
(
flags
.
columns
,
pd
.
MultiIndex
)
\
and
(
len
(
flags
.
columns
)
==
3
):
flags
=
flags
.
copy
()
flags
.
columns
=
flags
.
columns
.
get_level_values
(
ColumnLevels
.
FLAGS
)
else
:
raise
TypeError
return
flags
This diff is collapsed.
Click to expand it.
funcs/functions.py
+
37
−
8
View file @
2b7996b2
...
...
@@ -15,7 +15,8 @@ def flagDispatch(func_name, *args, **kwargs):
"
mad
"
:
flagMad
,
"
constant
"
:
flagConstant
,
"
range
"
:
flagRange
,
"
generic
"
:
flagGeneric
}
"
generic
"
:
flagGeneric
,
"
soilMoistureByFrost
"
:
flagSoilMoistureBySoilFrost
}
func
=
func_map
.
get
(
func_name
,
None
)
if
func
is
not
None
:
...
...
@@ -124,17 +125,11 @@ def flagSoilMoistureBySoilFrost(data, flags, field, flagger, soil_temp_reference
:param frost_level: Value level, the flagger shall check against, when evaluating soil frost level.
"""
# TODO: (To ASK):HOW TO FLAG nan values in input frame? general question: what should a test test?
# TODO: -> nan values with reference values that show frost, are flagged bad, nan values with reference value nan
# TODO: as well, are not flagged (test not applicable-> no flag)
# TODO: buffer zone for intermediate/fluctuating frost state
# retrieve data series input:
dataseries
=
pd
.
Series
(
data
[
field
].
values
,
index
=
pd
.
to_datetime
(
data
.
index
))
# retrieve reference input:
# if reference is a string, it refers to data field
# if reference series is part of input data frame, evaluate input data flags:
flag_mask
=
flagger
.
isFlagged
(
flags
)[
soil_temp_reference
]
# retrieve reference series
...
...
@@ -168,3 +163,37 @@ def flagSoilMoistureBySoilFrost(data, flags, field, flagger, soil_temp_reference
flags
.
loc
[
mask
.
values
,
field
]
=
flagger
.
setFlag
(
flags
.
loc
[
mask
,
field
],
**
kwargs
)
return
data
,
flags
def
flagSoilMoistureByPrecipitationEvents
(
data
,
flags
,
field
,
flagger
,
precipitation_reference
,
sensor_meas_depth
=
0
,
sensor_accuracy
=
0
,
soil_porosity
=
0
,
**
kwargs
):
"""
Flags soil moisture measurements by flagging moisture rises that do not follow a sufficient
precipitation event. If the measurement depth and accuracy of the soil moisture sensor and the porosity of the
surrounding soil are passed to the function, a lower bound for the precipitation that has to precede a significant
moisture rise within 24 hours can be estimated. If those values are not given, this lower bound is set
to zero. In that case, any non-zero precipitation count will justify any soil moisture rise.
:param data: The pandas dataframe, holding the data-to-be flagged.
:param flags: A dataframe holding the flags/flag-entries associated with
"
data
"
.
:param field: Fieldname of the Soil moisture measurements field in data.
:param flagger: A flagger - object.
:param precipitation_reference: Fieldname of the precipitation measurements in data.
:param sensor_meas_depth: Measurement depth of the soil moisture sensor in meter [m].
:param sensor_accuracy: Accuracy of the soil moisture sensor [-].
:param soil_porosity: Porosity of the soil surrounding the moisture sensor.
"""
# retrieve data series input:
dataseries
=
pd
.
Series
(
data
[
field
].
values
,
index
=
pd
.
to_datetime
(
data
.
index
))
# if reference series is part of input data frame, evaluate input data flags:
flag_mask
=
flagger
.
isFlagged
(
flags
)[
precipitation_reference
]
# retrieve reference series
refseries
=
pd
.
Series
(
data
[
precipitation_reference
].
values
,
index
=
pd
.
to_datetime
(
data
.
index
))
# drop flagged values:
refseries
=
refseries
.
loc
[
~
np
.
array
(
flag_mask
)]
# make refseries index a datetime thingy
refseries
.
index
=
pd
.
to_datetime
(
refseries
.
index
)
# drop nan values from reference series, since those are values you dont want to refer to.
refseries
=
refseries
.
dropna
()
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment