Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
K
km3io
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Package Registry
Container Registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
km3py
km3io
Merge requests
!47
Resolve "uproot4 integration"
Code
Review changes
Check out branch
Download
Patches
Plain diff
Merged
Resolve "uproot4 integration"
58-uproot4-integration-2
into
master
Overview
0
Commits
47
Pipelines
43
Changes
10
Merged
Tamas Gal
requested to merge
58-uproot4-integration-2
into
master
4 years ago
Overview
0
Commits
47
Pipelines
43
Changes
4
Expand
Closes
#58 (closed)
Edited
4 years ago
by
Tamas Gal
0
0
Merge request reports
Compare
version 30
version 41
89d0c2e9
4 years ago
version 40
c7355747
4 years ago
version 39
c92b061f
4 years ago
version 38
ff1c6c70
4 years ago
version 37
bf432120
4 years ago
version 36
a7e7244b
4 years ago
version 35
09b87761
4 years ago
version 34
79237108
4 years ago
version 33
27e9d8cd
4 years ago
version 32
080d9d54
4 years ago
version 31
6bdee7cb
4 years ago
version 30
f1af357f
4 years ago
version 29
b64bc8f5
4 years ago
version 28
483eab58
4 years ago
version 27
9b2c4b45
4 years ago
version 26
419d35a8
4 years ago
version 25
e13fc0a9
4 years ago
version 24
bd53990f
4 years ago
version 23
a56ed3af
4 years ago
version 22
d50fdb52
4 years ago
version 21
d80c1c33
4 years ago
version 20
26e549e0
4 years ago
version 19
2eb6c757
4 years ago
version 18
c3b7d044
4 years ago
version 17
3ddccf0a
4 years ago
version 16
8f2d8357
4 years ago
version 15
3cce5598
4 years ago
version 14
437c0bea
4 years ago
version 13
3ba9eccc
4 years ago
version 12
387225a8
4 years ago
version 11
000d7354
4 years ago
version 10
976019b8
4 years ago
version 9
0b6b8d86
4 years ago
version 8
0a3aad74
4 years ago
version 7
6b96db32
4 years ago
version 6
802be667
4 years ago
version 5
44bd42d3
4 years ago
version 4
2a6f1b71
4 years ago
version 3
ecf86b18
4 years ago
version 2
4bc26c9e
4 years ago
version 1
c8f1a399
4 years ago
master (base)
and
version 32
latest version
f26ee18a
47 commits,
4 years ago
version 41
89d0c2e9
46 commits,
4 years ago
version 40
c7355747
45 commits,
4 years ago
version 39
c92b061f
43 commits,
4 years ago
version 38
ff1c6c70
42 commits,
4 years ago
version 37
bf432120
41 commits,
4 years ago
version 36
a7e7244b
40 commits,
4 years ago
version 35
09b87761
39 commits,
4 years ago
version 34
79237108
37 commits,
4 years ago
version 33
27e9d8cd
36 commits,
4 years ago
version 32
080d9d54
35 commits,
4 years ago
version 31
6bdee7cb
34 commits,
4 years ago
version 30
f1af357f
33 commits,
4 years ago
version 29
b64bc8f5
31 commits,
4 years ago
version 28
483eab58
30 commits,
4 years ago
version 27
9b2c4b45
29 commits,
4 years ago
version 26
419d35a8
27 commits,
4 years ago
version 25
e13fc0a9
26 commits,
4 years ago
version 24
bd53990f
25 commits,
4 years ago
version 23
a56ed3af
24 commits,
4 years ago
version 22
d50fdb52
23 commits,
4 years ago
version 21
d80c1c33
22 commits,
4 years ago
version 20
26e549e0
20 commits,
4 years ago
version 19
2eb6c757
19 commits,
4 years ago
version 18
c3b7d044
18 commits,
4 years ago
version 17
3ddccf0a
17 commits,
4 years ago
version 16
8f2d8357
16 commits,
4 years ago
version 15
3cce5598
15 commits,
4 years ago
version 14
437c0bea
14 commits,
4 years ago
version 13
3ba9eccc
13 commits,
4 years ago
version 12
387225a8
12 commits,
4 years ago
version 11
000d7354
11 commits,
4 years ago
version 10
976019b8
10 commits,
4 years ago
version 9
0b6b8d86
9 commits,
4 years ago
version 8
0a3aad74
8 commits,
4 years ago
version 7
6b96db32
7 commits,
4 years ago
version 6
802be667
6 commits,
4 years ago
version 5
44bd42d3
5 commits,
4 years ago
version 4
2a6f1b71
4 commits,
4 years ago
version 3
ecf86b18
3 commits,
4 years ago
version 2
4bc26c9e
2 commits,
4 years ago
version 1
c8f1a399
1 commit,
4 years ago
Show latest version
4 files
+
89
−
32
Inline
Compare changes
Side-by-side
Inline
Show whitespace changes
Show one file at a time
Files
4
Search (e.g. *.vue) (Ctrl+P)
km3io/rootio.py
+
342
−
194
Options
#!/usr/bin/env python3
from
collections
import
namedtuple
import
numpy
as
np
import
awkward
as
ak
import
uproot
3
import
uproot
from
.tools
import
unfold_indices
# 110 MB based on the size of the largest basket found so far in km3net
BASKET_CACHE_SIZE
=
110
*
1024
**
2
BASKET_CACHE
=
uproot3
.
cache
.
ThreadSafeArrayCache
(
BASKET_CACHE_SIZE
)
class
BranchMapper
:
"""
Mapper helper for keys in a ROOT branch.
Parameters
----------
name: str
The name of the mapper helper which is displayed to the user
key: str
The key of the branch in the ROOT tree.
exclude: ``None``, ``list(str)``
Keys to exclude from parsing.
update: ``None``, ``dict(str: str)``
An update map for keys which are to be presented with a different
key to the user e.g. ``{
"
n_hits
"
:
"
hits
"
}`` will rename the ``hits``
key to ``n_hits``.
extra: ``None``, ``dict(str: str)``
An extra mapper for hidden object, primarily nested ones like
``t.fSec``, which can be revealed and mapped to e.g. ``t_sec``
via ``{
"
t_sec
"
,
"
t.fSec
"
}``.
attrparser: ``None``, ``function(str) -> str``
The function to be used to create attribute names. This is only
needed if unsupported characters are present, like ``.``, which
would prevent setting valid Python attribute names.
toawkward: ``None``, ``list(str)``
List of keys to convert to awkward arrays (recommended for
doubly ragged arrays)
"""
import
logging
def
__init__
(
self
,
name
,
key
,
extra
=
None
,
exclude
=
None
,
update
=
None
,
attrparser
=
None
,
flat
=
True
,
interpretations
=
None
,
toawkward
=
None
,
):
self
.
name
=
name
self
.
key
=
key
log
=
logging
.
getLogger
(
"
km3io.rootio
"
)
self
.
extra
=
{}
if
extra
is
None
else
extra
self
.
exclude
=
[]
if
exclude
is
None
else
exclude
self
.
update
=
{}
if
update
is
None
else
update
self
.
attrparser
=
(
lambda
x
:
x
)
if
attrparser
is
None
else
attrparser
self
.
flat
=
flat
self
.
interpretations
=
{}
if
interpretations
is
None
else
interpretations
self
.
toawkward
=
[]
if
toawkward
is
None
else
toawkward
class
EventReader
:
"""
reader for offline ROOT files
"""
class
Branch
:
"""
Branch accessor class
"""
event_path
=
None
item_name
=
"
Event
"
skip_keys
=
[]
# ignore these subbranches, even if they exist
aliases
=
{}
# top level aliases -> {fromkey: tokey}
nested_branches
=
{}
nested_aliases
=
{}
def
__init__
(
self
,
tree
,
mapper
,
f
,
index_chain
=
None
,
subbranchmaps
=
None
,
keymap
=
None
,
awkward_cache
=
None
,
step_size
=
2000
,
keys
=
None
,
aliases
=
None
,
nested_branches
=
None
,
event_ctor
=
None
,
):
self
.
_tree
=
tree
self
.
_mapper
=
mapper
self
.
_index_chain
=
[]
if
index_chain
is
None
else
index_chain
self
.
_keymap
=
None
self
.
_branch
=
tree
[
mapper
.
key
]
self
.
_subbranches
=
[]
self
.
_subbranchmaps
=
subbranchmaps
# FIXME preliminary cache to improve performance. Hopefully uproot4
# will fix this automatically!
self
.
_awkward_cache
=
{}
if
awkward_cache
is
None
else
awkward_cache
"""
EventReader base class
Parameters
----------
f : str or uproot4.reading.ReadOnlyDirectory (from uproot4.open)
Path to the file of interest or uproot4 filedescriptor.
step_size : int, optional
Number of events to read into the cache when iterating.
Choosing higher numbers may improve the speed but also increases
the memory overhead.
index_chain : list, optional
Keeps track of index chaining.
keys : list or set, optional
Branch keys.
aliases : dict, optional
Branch key aliases.
event_ctor : class or namedtuple, optional
Event constructor.
"""
if
isinstance
(
f
,
str
):
self
.
_fobj
=
uproot
.
open
(
f
)
self
.
_filepath
=
f
elif
isinstance
(
f
,
uproot
.
reading
.
ReadOnlyDirectory
):
self
.
_fobj
=
f
self
.
_filepath
=
f
.
_file
.
file_path
else
:
raise
TypeError
(
"
Unsupported file descriptor.
"
)
self
.
_step_size
=
step_size
self
.
_uuid
=
self
.
_fobj
.
_file
.
uuid
self
.
_iterator_index
=
0
self
.
_keys
=
keys
self
.
_event_ctor
=
event_ctor
self
.
_index_chain
=
[]
if
index_chain
is
None
else
index_chain
if
keymap
is
None
:
self
.
_initialise_keys
()
#
else
:
self
.
_keymap
=
keymap
if
subbranchmaps
is
not
None
:
for
mapper
in
subbranchmaps
:
subbranch
=
self
.
__class__
(
self
.
_tree
,
mapper
=
mapper
,
index_chain
=
self
.
_index_chain
,
awkward_cache
=
self
.
_awkward_cache
,
)
self
.
_subbranches
.
append
(
subbranch
)
for
subbranch
in
self
.
_subbranches
:
setattr
(
self
,
subbranch
.
_mapper
.
name
,
subbranch
)
if
aliases
is
not
None
:
self
.
aliases
=
aliases
if
nested_branches
is
not
None
:
self
.
nested_branches
=
nested_branches
if
self
.
_keys
is
None
:
self
.
_initialise_keys
()
if
self
.
_event_ctor
is
None
:
self
.
_event_ctor
=
namedtuple
(
self
.
item_name
,
set
(
list
(
self
.
keys
())
+
list
(
self
.
aliases
)
+
list
(
self
.
nested_branches
)
+
list
(
self
.
nested_aliases
)
),
)
def
_initialise_keys
(
self
):
"""
Create the keymap and instance attributes for branch keys
"""
# TODO: this could be a cached property
keys
=
set
(
k
.
decode
(
"
utf-8
"
)
for
k
in
self
.
_branch
.
keys
())
-
set
(
self
.
_mapper
.
exclude
skip_keys
=
set
(
self
.
skip_keys
)
all_keys
=
set
(
self
.
_fobj
[
self
.
event_path
].
keys
())
toplevel_keys
=
set
(
k
.
split
(
"
/
"
)[
0
]
for
k
in
all_keys
)
valid_aliases
=
{}
for
fromkey
,
tokey
in
self
.
aliases
.
items
():
if
tokey
in
all_keys
:
valid_aliases
[
fromkey
]
=
tokey
self
.
aliases
=
valid_aliases
keys
=
(
toplevel_keys
-
skip_keys
).
union
(
list
(
valid_aliases
)
+
list
(
self
.
nested_aliases
)
)
self
.
_keymap
=
{
**
{
self
.
_mapper
.
attrparser
(
k
):
k
for
k
in
keys
},
**
self
.
_mapper
.
extra
,
}
self
.
_keymap
.
update
(
self
.
_mapper
.
update
)
for
k
in
self
.
_mapper
.
update
.
values
():
del
self
.
_keymap
[
k
]
for
key
in
self
.
_keymap
.
keys
():
setattr
(
self
,
key
,
None
)
for
key
in
list
(
self
.
nested_branches
)
+
list
(
self
.
nested_aliases
):
keys
.
add
(
"
n_
"
+
key
)
# self._grouped_branches = {k for k in toplevel_keys - skip_keys if isinstance(self._fobj[self.event_path][k].interpretation, uproot.AsGrouped)}
valid_nested_branches
=
{}
for
nested_key
,
aliases
in
self
.
nested_branches
.
items
():
if
nested_key
in
toplevel_keys
:
valid_nested_branches
[
nested_key
]
=
{}
subbranch_keys
=
self
.
_fobj
[
self
.
event_path
][
nested_key
].
keys
()
for
fromkey
,
tokey
in
aliases
.
items
():
if
tokey
in
subbranch_keys
:
valid_nested_branches
[
nested_key
][
fromkey
]
=
tokey
self
.
nested_branches
=
valid_nested_branches
self
.
_keys
=
keys
def
__dir__
(
self
):
"""
Tab completion in IPython
"""
return
list
(
self
.
keys
())
+
[
"
header
"
]
def
keys
(
self
):
return
self
.
_keymap
.
keys
()
"""
Returns all accessible branch keys, without the skipped ones.
"""
return
self
.
_keys
def
__getattribute__
(
self
,
attr
):
if
attr
.
startswith
(
"
_
"
):
# let all private and magic methods pass
return
object
.
__getattribute__
(
self
,
attr
)
if
attr
in
self
.
_keymap
.
keys
():
# intercept branch key lookups
return
self
.
__getkey__
(
attr
)
@property
def
events
(
self
):
# TODO: deprecate this, since `self` is already the container type
return
iter
(
self
)
def
_keyfor
(
self
,
key
):
"""
Return the correct key for a given alias/key
"""
return
self
.
nested_aliases
.
get
(
key
,
key
)
def
__getattr__
(
self
,
attr
):
attr
=
self
.
_keyfor
(
attr
)
# if attr in self.keys() or (attr.startswith("n_") and self._keyfor(attr.split("n_")[1]) in self._grouped_branches):
if
attr
in
self
.
keys
():
return
self
.
__getitem__
(
attr
)
raise
AttributeError
(
f
"'
{
self
.
__class__
.
__name__
}
'
object has no attribute
'
{
attr
}
'"
)
return
object
.
__getattribute__
(
self
,
attr
)
def
__getitem__
(
self
,
key
):
# indexing
# TODO: maybe just propagate everything to awkward and let it deal
# with the type?
if
isinstance
(
key
,
(
slice
,
int
,
np
.
int32
,
np
.
int64
,
list
,
np
.
ndarray
,
ak
.
Array
)
):
if
isinstance
(
key
,
(
int
,
np
.
int32
,
np
.
int64
)):
key
=
int
(
key
)
return
self
.
__class__
(
self
.
_fobj
,
index_chain
=
self
.
_index_chain
+
[
key
],
step_size
=
self
.
_step_size
,
aliases
=
self
.
aliases
,
nested_branches
=
self
.
nested_branches
,
keys
=
self
.
keys
(),
event_ctor
=
self
.
_event_ctor
,
)
# group counts, for e.g. n_events, n_hits etc.
if
isinstance
(
key
,
str
)
and
key
.
startswith
(
"
n_
"
):
key
=
self
.
_keyfor
(
key
.
split
(
"
n_
"
)[
1
])
arr
=
self
.
_fobj
[
self
.
event_path
][
key
].
array
(
uproot
.
AsDtype
(
"
>i4
"
))
return
unfold_indices
(
arr
,
self
.
_index_chain
)
key
=
self
.
_keyfor
(
key
)
branch
=
self
.
_fobj
[
self
.
event_path
]
# These are special branches which are nested, like hits/trks/mc_trks
# We are explicitly grabbing just a predefined set of subbranches
# and also alias them to be backwards compatible (and attribute-accessible)
if
key
in
self
.
nested_branches
:
fields
=
[]
# some fields are not always available, like `usr_names`
for
to_field
,
from_field
in
self
.
nested_branches
[
key
].
items
():
if
from_field
in
branch
[
key
].
keys
():
fields
.
append
(
to_field
)
log
.
debug
(
fields
)
return
Branch
(
branch
[
key
],
fields
,
self
.
nested_branches
[
key
],
self
.
_index_chain
)
else
:
return
unfold_indices
(
branch
[
self
.
aliases
.
get
(
key
,
key
)].
array
(),
self
.
_index_chain
)
def
__getkey__
(
self
,
key
):
interpretation
=
self
.
_mapper
.
interpretations
.
get
(
key
)
def
__iter__
(
self
,
chunkwise
=
False
):
self
.
_events
=
self
.
_event_generator
(
chunkwise
=
chunkwise
)
return
self
if
key
==
"
usr_names
"
:
# TODO this will be fixed soon in uproot,
# see https://github.com/scikit-hep/uproot/issues/465
interpretation
=
uproot3
.
asgenobj
(
uproot3
.
SimpleArray
(
uproot3
.
STLVector
(
uproot3
.
STLString
())),
self
.
_branch
[
self
.
_keymap
[
key
]].
_context
,
6
,
def
_get_iterator_limits
(
self
):
"""
Determines start and stop, used for event iteration
"""
if
len
(
self
.
_index_chain
)
>
1
:
raise
NotImplementedError
(
"
iteration is currently not supported with nested slices
"
)
if
key
==
"
usr
"
:
# triple jagged array is wrongly parsed in uproot3
interpretation
=
uproot3
.
asgenobj
(
uproot3
.
SimpleArray
(
uproot3
.
STLVector
(
uproot3
.
asdtype
(
"
>f8
"
))),
self
.
_branch
[
self
.
_keymap
[
key
]].
_context
,
6
,
if
self
.
_index_chain
:
s
=
self
.
_index_chain
[
0
]
if
not
isinstance
(
s
,
slice
):
raise
NotImplementedError
(
"
iteration is only supported with slices
"
)
if
s
.
step
is
None
or
s
.
step
==
1
:
start
=
s
.
start
stop
=
s
.
stop
else
:
raise
NotImplementedError
(
"
iteration is only supported with single steps
"
)
else
:
start
=
None
stop
=
None
return
start
,
stop
def
_event_generator
(
self
,
chunkwise
=
False
):
start
,
stop
=
self
.
_get_iterator_limits
()
if
chunkwise
:
raise
NotImplementedError
(
"
iterating over chunks is not implemented yet
"
)
events
=
self
.
_fobj
[
self
.
event_path
]
group_count_keys
=
set
(
k
for
k
in
self
.
keys
()
if
k
.
startswith
(
"
n_
"
)
)
# extra keys to make it easy to count subbranch lengths
log
.
debug
(
"
group_count_keys: %s
"
,
group_count_keys
)
keys
=
set
(
list
(
set
(
self
.
keys
())
-
set
(
self
.
nested_branches
.
keys
())
-
set
(
self
.
nested_aliases
)
-
group_count_keys
)
out
=
self
.
_branch
[
self
.
_keymap
[
key
]].
lazyarray
(
interpretation
=
interpretation
,
basketcache
=
BASKET_CACHE
+
list
(
self
.
aliases
.
keys
())
)
# all top-level keys for regular branches
log
.
debug
(
"
keys: %s
"
,
keys
)
log
.
debug
(
"
aliases: %s
"
,
self
.
aliases
)
events_it
=
events
.
iterate
(
keys
,
aliases
=
self
.
aliases
,
step_size
=
self
.
_step_size
,
entry_start
=
start
,
entry_stop
=
stop
,
)
if
self
.
_index_chain
is
not
None
and
key
in
self
.
_mapper
.
toawkward
:
cache_key
=
self
.
_mapper
.
name
+
"
/
"
+
key
if
cache_key
not
in
self
.
_awkward_cache
:
if
len
(
out
)
>
20000
:
# It will take more than 10 seconds
print
(
"
Creating cache for
'
{}
'
.
"
.
format
(
cache_key
))
self
.
_awkward_cache
[
cache_key
]
=
ak
.
from_iter
(
out
)
out
=
self
.
_awkward_cache
[
cache_key
]
return
unfold_indices
(
out
,
self
.
_index_chain
)
def
__getitem__
(
self
,
item
):
"""
Slicing magic
"""
if
isinstance
(
item
,
str
):
return
self
.
__getkey__
(
item
)
if
isinstance
(
item
,
(
np
.
int32
,
np
.
int64
)):
item
=
int
(
item
)
# if item.__class__.__name__ == "ChunkedArray":
# item = np.array(item)
nested
=
[]
nested_keys
=
(
self
.
nested_branches
.
keys
()
)
# dict-key ordering is an implementation detail
log
.
debug
(
"
nested_keys: %s
"
,
nested_keys
)
for
key
in
nested_keys
:
nested
.
append
(
events
[
key
].
iterate
(
self
.
nested_branches
[
key
].
keys
(),
aliases
=
self
.
nested_branches
[
key
],
step_size
=
self
.
_step_size
,
entry_start
=
start
,
entry_stop
=
stop
,
)
)
group_counts
=
{}
for
key
in
group_count_keys
:
group_counts
[
key
]
=
iter
(
self
[
key
])
log
.
debug
(
"
group_counts: %s
"
,
group_counts
)
for
event_set
,
*
nested_sets
in
zip
(
events_it
,
*
nested
):
for
_event
,
*
nested_items
in
zip
(
event_set
,
*
nested_sets
):
data
=
{}
for
k
in
keys
:
data
[
k
]
=
_event
[
k
]
for
(
k
,
i
)
in
zip
(
nested_keys
,
nested_items
):
data
[
k
]
=
i
for
tokey
,
fromkey
in
self
.
nested_aliases
.
items
():
data
[
tokey
]
=
data
[
fromkey
]
for
key
in
group_counts
:
data
[
key
]
=
next
(
group_counts
[
key
])
yield
self
.
_event_ctor
(
**
data
)
return
self
.
__class__
(
self
.
_tree
,
self
.
_mapper
,
index_chain
=
self
.
_index_chain
+
[
item
],
keymap
=
self
.
_keymap
,
subbranchmaps
=
self
.
_subbranchmaps
,
awkward_cache
=
self
.
_awkward_cache
,
)
def
__next__
(
self
):
return
next
(
self
.
_events
)
def
__len__
(
self
):
if
not
self
.
_index_chain
:
return
len
(
self
.
_
branch
)
return
self
.
_
fobj
[
self
.
event_path
].
num_entries
elif
isinstance
(
self
.
_index_chain
[
-
1
],
(
int
,
np
.
int32
,
np
.
int64
)):
if
len
(
self
.
_index_chain
)
==
1
:
try
:
return
len
(
self
[:])
except
IndexError
:
return
1
# TODO: not sure why this is needed at all, it's too late...
return
1
# try:
# return len(self[:])
# except IndexError:
# return 1
return
1
else
:
# ignore the usual index magic and access `id` directly
return
len
(
unfold_indices
(
self
.
_branch
[
self
.
_keymap
[
"
id
"
]].
lazyarray
(
basketcache
=
BASKET_CACHE
),
self
.
_index_chain
,
self
.
_fobj
[
self
.
event_path
][
"
id
"
].
array
(),
self
.
_index_chain
)
)
def
__actual_len__
(
self
):
"""
The raw number of events without any indexing/slicing magic
"""
return
len
(
self
.
_fobj
[
self
.
event_path
][
"
id
"
].
array
())
def
__repr__
(
self
):
length
=
len
(
self
)
actual_length
=
self
.
__actual_len__
()
return
f
"
{
self
.
__class__
.
__name__
}
(
{
length
}{
'
/
'
+
str
(
actual_length
)
if
length
<
actual_length
else
''
}
events)
"
@property
def
is_single
(
self
):
"""
Returns True when a single branch is selected.
"""
if
len
(
self
.
_index_chain
)
>
0
:
if
isinstance
(
self
.
_index_chain
[
0
],
(
int
,
np
.
int32
,
np
.
int64
)):
return
True
return
False
def
__iter__
(
self
):
self
.
_iterator_index
=
0
def
uuid
(
self
):
return
self
.
_uuid
def
close
(
self
):
self
.
_fobj
.
close
()
def
__enter__
(
self
):
return
self
def
__next__
(
self
):
idx
=
self
.
_iterator_index
self
.
_iterator_index
+=
1
if
idx
>=
len
(
self
):
raise
StopIteration
return
self
[
idx
]
def
__exit__
(
self
,
*
args
):
self
.
close
()
def
__str__
(
self
):
length
=
len
(
self
)
return
"
{} ({}) with {} element{}
"
.
format
(
self
.
__class__
.
__name__
,
self
.
_mapper
.
name
,
length
,
"
s
"
if
length
>
1
else
""
,
class
Branch
:
"""
Helper class for nested branches likes tracks/hits
"""
def
__init__
(
self
,
branch
,
fields
,
aliases
,
index_chain
):
self
.
_branch
=
branch
self
.
fields
=
fields
self
.
_aliases
=
aliases
self
.
_index_chain
=
index_chain
def
__dir__
(
self
):
"""
Tab completion in IPython
"""
return
list
(
self
.
fields
)
def
__getattr__
(
self
,
attr
):
if
attr
not
in
self
.
_aliases
:
raise
AttributeError
(
f
"
No field named
{
attr
}
. Available fields:
{
self
.
fields
}
"
)
key
=
self
.
_aliases
[
attr
]
if
self
.
_index_chain
:
idx0
=
self
.
_index_chain
[
0
]
if
isinstance
(
idx0
,
(
int
,
np
.
int32
,
np
.
int64
)):
# optimise single-element and slice lookups
start
=
idx0
stop
=
idx0
+
1
arr
=
ak
.
flatten
(
self
.
_branch
[
key
].
array
(
entry_start
=
start
,
entry_stop
=
stop
)
)
return
unfold_indices
(
arr
,
self
.
_index_chain
[
1
:])
if
isinstance
(
idx0
,
slice
):
if
idx0
.
step
is
None
or
idx0
.
step
==
1
:
start
=
idx0
.
start
stop
=
idx0
.
stop
arr
=
self
.
_branch
[
key
].
array
(
entry_start
=
start
,
entry_stop
=
stop
)
return
unfold_indices
(
arr
,
self
.
_index_chain
[
1
:])
return
unfold_indices
(
self
.
_branch
[
key
].
array
(),
self
.
_index_chain
)
def
__getitem__
(
self
,
key
):
return
self
.
__class__
(
self
.
_branch
,
self
.
fields
,
self
.
_aliases
,
self
.
_index_chain
+
[
key
]
)
def
__len__
(
self
):
if
not
self
.
_index_chain
:
return
self
.
_branch
.
num_entries
elif
isinstance
(
self
.
_index_chain
[
-
1
],
(
int
,
np
.
int32
,
np
.
int64
)):
if
len
(
self
.
_index_chain
)
==
1
:
return
1
# try:
# return len(self[:])
# except IndexError:
# return 1
return
1
else
:
# ignore the usual index magic and access `id` directly
return
len
(
self
.
id
)
def
__actual_len__
(
self
):
"""
The raw number of events without any indexing/slicing magic
"""
return
len
(
self
.
_branch
[
self
.
_aliases
[
"
id
"
]].
array
())
def
__repr__
(
self
):
length
=
len
(
self
)
return
"
<{}[{}]: {} element{}>
"
.
format
(
self
.
__class__
.
__name__
,
self
.
_mapper
.
name
,
length
,
"
s
"
if
length
>
1
else
""
,
)
actual_length
=
self
.
__actual_len__
()
return
f
"
{
self
.
__class__
.
__name__
}
(
{
length
}{
'
/
'
+
str
(
actual_length
)
if
length
<
actual_length
else
''
}
{
self
.
_branch
.
name
}
)
"
@property
def
ndim
(
self
):
if
not
self
.
_index_chain
:
return
2
elif
any
(
isinstance
(
i
,
(
int
,
np
.
int32
,
np
.
int64
))
for
i
in
self
.
_index_chain
):
return
1
return
2
Loading