Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
S
SMART
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
3
Issues
3
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Registry
Registry
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
UNI-KLU
SMART
Commits
4d887b0a
Commit
4d887b0a
authored
Dec 18, 2020
by
Alexander Lercher
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Extracted methods for db access from time slicing
parent
688215a0
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
31 additions
and
8 deletions
+31
-8
repository.py
...ub/role-stage-discovery-microservice/app/db/repository.py
+1
-1
run_time_slicing.py
...role-stage-discovery-microservice/app/run_time_slicing.py
+30
-7
No files found.
src/data-hub/role-stage-discovery-microservice/app/db/repository.py
View file @
4d887b0a
...
...
@@ -73,7 +73,7 @@ class Repository(MongoRepositoryBase):
def
add_layer_nodes
(
self
,
nodes
:
List
[
dict
]):
super
()
.
insert_many
(
self
.
_layer_nodes_collection
,
nodes
)
def
get_layer_nodes
(
self
,
use_case
:
str
,
use_case_table
:
str
,
layer_name
:
str
)
->
dict
:
def
get_layer_nodes
(
self
,
use_case
:
str
,
use_case_table
:
str
,
layer_name
:
str
)
->
List
[
dict
]
:
'''Returns all nodes for the use-case and layer.'''
entries
=
super
()
.
get_entries
(
self
.
_layer_nodes_collection
,
selection
=
{
'use_case'
:
use_case
,
'use_case_table'
:
use_case_table
,
'layer_name'
:
layer_name
},
projection
=
{
'_id'
:
0
})
return
[
e
for
e
in
entries
]
...
...
src/data-hub/role-stage-discovery-microservice/app/run_time_slicing.py
View file @
4d887b0a
...
...
@@ -15,6 +15,9 @@ TimeSliceKey = Tuple[int, int]
# TODO extract information about time features (maybe from table mapping)
TIME_PROPERTY_NAMES
=
[
'Timestamp'
]
repo
=
Repository
()
def
convert_to_time_slice_key
(
timestamp
:
str
)
->
TimeSliceKey
:
'''Returns the tuple (year, week_of_year) from a timestamp. This is used as the key for the slicing.'''
# time = datetime.utcfromtimestamp(float(timestamp[0:10]))
...
...
@@ -52,22 +55,37 @@ def split_clusterset_by_time(layer: Layer, clusters: List[Cluster]) -> Dict[Time
return
time_slices
if
__name__
==
"__main__"
:
re
po
=
Repository
()
def
get_layers
()
:
re
turn
repo
.
get_layers
()
repo
.
remove_all_time_slices
()
def
get_clusters_for_layer
(
use_case
,
use_case_table
,
layer_name
):
return
repo
.
get_clusters_for_layer
(
use_case
,
use_case_table
,
layer_name
)
layers
=
repo
.
get_layers
()
def
get_layer_nodes
(
use_case
,
use_case_table
,
layer_name
):
return
repo
.
get_layer_nodes
(
use_case
,
use_case_table
,
layer_name
)
def
add_time_slice
(
timeslice
):
repo
.
add_time_slice
(
timeslice
)
def
run_time_slicing
(
selected_use_cases
:
List
[
str
]
=
None
,
selected_use_case_tables
:
List
[
str
]
=
None
,
selected_layer_names
:
List
[
str
]
=
None
):
layers
=
get_layers
()
for
layer
in
layers
:
layer_name
=
layer
.
layer_name
use_case
=
layer
.
use_case
use_case_table
=
layer
.
use_case_table
# skip layers not in the params
if
selected_use_cases
is
not
None
and
use_case
not
in
selected_use_cases
\
or
selected_use_case_tables
is
not
None
and
use_case_table
not
in
selected_use_case_tables
\
or
selected_layer_names
is
not
None
and
layer_name
not
in
selected_layer_names
:
continue
print
(
f
"Working on {use_case}//{use_case_table}//{layer_name}."
)
clusters_for_layer
=
repo
.
get_clusters_for_layer
(
use_case
,
use_case_table
,
layer_name
)
clusters_for_layer
=
get_clusters_for_layer
(
use_case
,
use_case_table
,
layer_name
)
# if no clusters were generated use one large cluster instead of skipping the layer
if
clusters_for_layer
is
None
or
len
(
clusters_for_layer
)
==
0
:
nodes
=
repo
.
get_layer_nodes
(
use_case
,
use_case_table
,
layer_name
)
nodes
=
get_layer_nodes
(
use_case
,
use_case_table
,
layer_name
)
if
nodes
is
None
or
len
(
nodes
)
==
0
:
print
(
"Skipping, because there are no clusters and no nodes for the layer."
)
continue
...
...
@@ -76,4 +94,9 @@ if __name__ == "__main__":
time_slices
=
split_clusterset_by_time
(
layer
,
clusters_for_layer
)
for
k
,
v
in
time_slices
.
items
():
repo
.
add_time_slice
(
v
)
add_time_slice
(
v
)
if
__name__
==
"__main__"
:
repo
.
remove_all_time_slices
()
run_time_slicing
([],[],[])
\ No newline at end of file
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment