Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
dios
Manage
Activity
Members
Labels
Plan
Issues
11
Issue boards
Milestones
Wiki
Jira
Code
Merge requests
0
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Container Registry
Model registry
Operate
Environments
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
RDM
dios
Commits
9c5413d3
Commit
9c5413d3
authored
5 years ago
by
Bert Palm
🎇
Browse files
Options
Downloads
Patches
Plain Diff
added .iloc
parent
a1eb979b
No related branches found
Branches containing commit
No related tags found
Tags containing commit
2 merge requests
!2
Develop
,
!1
complete rework
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
dios/__init__.py
+0
-3
0 additions, 3 deletions
dios/__init__.py
dios/dios.py
+103
-16
103 additions, 16 deletions
dios/dios.py
tests/run_dios.py
+2
-2
2 additions, 2 deletions
tests/run_dios.py
with
105 additions
and
21 deletions
dios/__init__.py
+
0
−
3
View file @
9c5413d3
from
dios.dios
import
*
from
dios.profiling.generate_testsets
import
get_testset
,
var_prefix
from
dios.profiling.performance
import
gen_random_timestamps
,
find_index_range
This diff is collapsed.
Click to expand it.
dios/dios.py
+
103
−
16
View file @
9c5413d3
...
...
@@ -8,14 +8,22 @@ import datetime as dt
from
collections
import
OrderedDict
from
pandas.core.dtypes.common
import
(
is_list_like
,
is_iterator
,
is_scalar
,
is_number
,
is_integer
,
)
from
pandas.core.dtypes.common
import
is_iterator
as
_is_iterator
from
pandas.core.indexing
import
need_slice
def is_iterator(obj):
    """
    Tell whether ``obj`` is an iterator, by delegating to pandas' ``is_iterator``.

    This wrapper exists only to carry a warning: the example in the pandas
    documentation of that function is misleading. Contrary to what it shows,

    >> is_iterator([1, 2, 3])

    evaluates to False - a list is iterable, but it is not an iterator.
    """
    verdict = _is_iterator(obj)
    return verdict
class
DictOfSeries
:
"""
DictionaryOfSeries is a collection of pd.Series
'
s which aim to be as close as possible similar to
...
...
@@ -198,6 +206,9 @@ class DictOfSeries:
if
isinstance
(
value
,
DictOfSeries
):
self
.
_setitem_dios
(
keys
,
slicer
,
value
)
else
:
if
is_iterator
(
value
):
value
=
list
(
value
)
for
k
in
keys
:
self
.
_setitem
(
k
,
value
,
slicer
)
...
...
@@ -228,18 +239,19 @@ class DictOfSeries:
return
sl
=
sl
or
slice
(
None
)
item
=
self
.
_data
[
key
]
# label, scalar: dios['a'] = 3.9 or
# slice, scalar: dios[0:3] = 4.0
if
is_scalar
(
val
):
self
.
_data
[
key
]
[
sl
]
=
val
item
[
sl
]
=
val
# label, list: dios['a'] = [0.0, 0.3, 0.0]
# slice, list: dios[0:3] = [0.0, 0.3, 0.0]
elif
is_list_like
(
val
):
# ensure same size
if
len
(
self
.
_data
[
key
])
==
len
(
val
):
self
.
_data
[
key
]
[
sl
]
=
val
# ensure same size
# fixme: is this necessary, wouldn't pd.Series raise a ValueError?
if
len
(
item
[
sl
])
==
len
(
val
):
item
[
sl
]
=
val
else
:
raise
ValueError
(
f
'
Length of values does not match length of index for the key
{
key
}
'
)
else
:
...
...
@@ -255,6 +267,10 @@ class DictOfSeries:
def
loc
(
self
):
return
_LocIndexer
(
self
)
@property
def iloc(self):
    """Return a fresh ``_iLocIndexer`` bound to this object (``obj.iloc[...]``)."""
    indexer = _iLocIndexer(self)
    return indexer
def __str__(self):
    """Return the same text as ``__repr__``, so ``str(obj)`` and ``repr(obj)`` agree."""
    text = self.__repr__()
    return text
...
...
@@ -496,17 +512,38 @@ class DictOfSeries:
return
news
.
squeeze
()
class
_LocIndexer
:
class _Indexer:
    """
    Shared base of the indexer helpers (subclassed by ``_LocIndexer`` and
    ``_iLocIndexer``).

    It only remembers the object it was created for and keeps a short handle
    to that object's ``_data`` attribute.
    """

    def __init__(self, _dios):
        # short handle to the underlying column storage
        self._data = _dios._data
        # the object this indexer operates on
        self._dios = _dios
class
_LocIndexer
(
_Indexer
):
def
__init__
(
self
,
_dios
):
super
().
__init__
(
_dios
)
self
.
_check_keys
=
_dios
.
_check_keys
def
__getitem__
(
self
,
key
):
# if we have a tuple, we have rows and columns
# if not we have only rows and work on all columns
rkey
,
cols
=
self
.
_unpack_key
(
key
)
new
=
DictOfSeries
()
for
c
in
cols
:
new
[
c
]
=
self
.
_data
[
c
].
loc
[
rkey
]
return
new
def
__setitem__
(
self
,
key
,
value
):
rkey
,
cols
=
self
.
_unpack_key
(
key
)
# todo: dios -> dios_to_dios, -> series
# scalar, -> automatically
# series, -> automatically
# list_like -> check length
for
c
in
cols
:
self
.
_data
[
c
].
loc
[
rkey
]
=
value
def
_unpack_key
(
self
,
key
):
# if we have a tuple, we have a rows- and a column-indexer
# if not, we only have a row-indexer and work on all columns
if
isinstance
(
key
,
tuple
):
rkey
,
ckey
,
*
fail
=
key
if
fail
:
...
...
@@ -530,12 +567,7 @@ class _LocIndexer:
else
:
cols
=
self
.
_data
.
keys
()
rkey
=
key
# pass the row-key directly to pd.Series.loc[row-key]
new
=
DictOfSeries
()
for
c
in
cols
:
new
[
c
]
=
self
.
_data
[
c
].
loc
[
rkey
]
return
new
return
rkey
,
cols
def
_col_slice_to_col_list
(
self
,
cslice
):
"""
see here:
...
...
@@ -552,3 +584,58 @@ class _LocIndexer:
return
keys
[
slice
(
start
,
stop
+
1
,
cslice
.
step
)]
class _iLocIndexer(_Indexer):
    """
    Integer-position based indexer, handed out by the ``iloc`` property.

    Two forms of key are understood:

    * ``obj.iloc[rows]`` - ``rows`` is applied to every column.
    * ``obj.iloc[rows, columns]`` - ``columns`` selects columns by position
      and may be an integer, a slice of integers (open ends allowed), or a
      list-like / iterator of integers.

    The row indexer is never inspected here; it is passed unchanged to the
    ``.iloc`` accessor of each selected column.
    """

    def __getitem__(self, key):
        """
        Return a new ``DictOfSeries`` holding the selected rows of the
        selected columns.

        Raises
        ------
        KeyError
            Too many indexers, an unsupported column indexer type, or a
            column position that is out of bounds.
        TypeError
            A column slice with non-integer start, stop or step.
        """
        rkey, cols = self._unpack_key(key)
        new = DictOfSeries()
        for c in cols:
            new[c] = self._data[c].iloc[rkey]
        return new

    def _unpack_key(self, key):
        """
        Split ``key`` into ``(row_indexer, column_keys)``.

        A tuple carries a row- and a column-indexer. Anything else is taken
        as a row-indexer that applies to all columns.
        """
        if not isinstance(key, tuple):
            return key, self._data.keys()

        rkey, ckey, *fail = key
        if fail:
            raise KeyError("To many indexers")

        # iterators can only be consumed once, so materialize them first
        if is_iterator(ckey):
            ckey = list(ckey)

        # translate the positional column indexer into actual column keys
        if is_integer(ckey):
            self._check_keys([ckey])
            cols = self._integers_to_col_list([ckey])
        elif isinstance(ckey, slice):
            cols = self._col_slice_to_col_list(ckey)
        elif is_list_like(ckey):
            self._check_keys(ckey)
            cols = self._integers_to_col_list(ckey)
        else:
            raise KeyError(f"Type {type(ckey)} is not supported for indexing on columns.")
        return rkey, cols

    def _check_keys(self, keys):
        """Raise ``KeyError`` if any position in ``keys`` lies outside the columns."""
        bound = len(self._data)
        # negative positions count from the end, like in list indexing
        valid = range(-bound, bound)
        for k in keys:
            if k not in valid:
                raise KeyError("positional indexer(s) are out-of-bounds in columns")

    def _integers_to_col_list(self, ints):
        """
        Map column positions to column keys.

        The result is a list in the order the positions were requested, with
        repeated positions collapsed to their first occurrence. (A set was
        used before, which made the column order of the result arbitrary.)
        """
        klist = list(self._data.keys())
        return list(dict.fromkeys(klist[i] for i in ints))

    def _col_slice_to_col_list(self, sl):
        """
        Resolve a positional column slice to the list of column keys it covers.

        ``None`` for start, stop or step means "not given" and is allowed, so
        that open-ended slices such as ``[:, :]`` or ``[:, 1:]`` work. Every
        part that is given must be an integer.
        """
        for s in [sl.start, sl.stop, sl.step]:
            if s is not None and not is_integer(s):
                raise TypeError(f"positional indexing with slice must be integers, passed was {s} of {type(s)}")
        return list(self._data.keys())[sl]
This diff is collapsed.
Click to expand it.
tests/run_dios.py
+
2
−
2
View file @
9c5413d3
...
...
@@ -9,8 +9,8 @@ if __name__ == '__main__':
dios_options
[
Options
.
allow_mixed_indextypes
]
=
True
a
=
dios
.
loc
[:]
#
df = pd.DataFrame([1,24,5,456,45], index=pd.date_range(periods=5, freq='1d', start='2000-01-01'))
#
a = df.loc[
"2000-01-02":
]
df
=
pd
.
DataFrame
([
1
,
24
,
5
,
456
,
45
],
index
=
pd
.
date_range
(
periods
=
5
,
freq
=
'
1d
'
,
start
=
'
2000-01-01
'
))
a
=
df
.
i
loc
[
:,
0
]
print
(
a
)
exit
(
4
)
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment