Skip to content

Commit 83d05ea

Browse files
authored
Merge pull request #153 from Oxid15/develop
0.10.0 - Update
2 parents 6adfcbb + 6211d38 commit 83d05ea

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

51 files changed

+1639
-692
lines changed

cascade/__init__.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515
"""
1616

1717

18-
__version__ = '0.9.0'
18+
__version__ = '0.10.0'
1919
__author__ = 'Ilia Moiseev'
2020
__author_email__ = '[email protected]'
2121

cascade/base/__init__.py

+23-3
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,30 @@
1414
limitations under the License.
1515
"""
1616

17-
from typing import List, Dict, Any
17+
from typing import Union, List, Dict, Any
18+
19+
"""
20+
Single Meta of basic object is just a dict, however Cascade supports
21+
pipelines with lists of meta.
22+
23+
Do not use Meta when returning from `get_meta` methods! Use PipeMeta instead.
24+
Meta type alias is designed for better readability and to explicitly state when the
25+
variable is meta.
26+
"""
27+
Meta = Dict[Any, Any]
28+
29+
"""
30+
This type is used when `get_meta` is called on any Traceable
31+
"""
32+
PipeMeta = List[Meta]
33+
34+
"""
35+
This type described what we can get when reading previously written to meta object
36+
"""
37+
MetaFromFile = Union[List[Any], Dict[Any, Any]]
1838

19-
Meta = List[Dict[Any, Any]]
2039

2140
from .meta_handler import MetaHandler, supported_meta_formats
22-
from .traceable import Traceable, Meta
41+
from .traceable import Traceable
2342
from .meta_handler import CustomEncoder as JSONEncoder
43+
from .history_logger import HistoryLogger

cascade/base/history_logger.py

+71
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,71 @@
1+
"""
2+
Copyright 2022 Ilia Moiseev
3+
4+
Licensed under the Apache License, Version 2.0 (the "License");
5+
you may not use this file except in compliance with the License.
6+
You may obtain a copy of the License at
7+
8+
http://www.apache.org/licenses/LICENSE-2.0
9+
10+
Unless required by applicable law or agreed to in writing, software
11+
distributed under the License is distributed on an "AS IS" BASIS,
12+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
See the License for the specific language governing permissions and
14+
limitations under the License.
15+
"""
16+
17+
import os
18+
from typing import Any
19+
from .meta_handler import MetaHandler
20+
21+
22+
class HistoryLogger:
23+
"""
24+
An interface to log meta into history files
25+
"""
26+
def __init__(self, filepath: str) -> None:
27+
"""
28+
Parameters
29+
----------
30+
filepath: str
31+
Path to the history log file
32+
"""
33+
self._mh = MetaHandler()
34+
self._log_file = filepath
35+
36+
if os.path.exists(self._log_file):
37+
try:
38+
self._log = self._mh.read(self._log_file)
39+
if isinstance(self._log, list):
40+
raise RuntimeError(
41+
f'Failed to initialize history logger due to unexpected object'
42+
f' format - log is the instance of list and not dict.'
43+
f' Check your {self._log_file} file')
44+
if 'history' not in self._log:
45+
raise RuntimeError(
46+
f'Failed to initialize history logger due to unexpected object'
47+
f' format - "history" key is missing.'
48+
f' Check your {self._log_file} file')
49+
except IOError as e:
50+
raise IOError(f'Failed to read log file: {self._log_file }') from e
51+
else:
52+
self._log = {
53+
'history': [],
54+
'type': 'history'
55+
}
56+
57+
def log(self, obj: Any) -> None:
58+
"""
59+
Logs the state of the object
60+
61+
Parameters
62+
----------
63+
obj: Any
64+
Meta data of the object
65+
"""
66+
self._log['history'].append(obj)
67+
68+
try:
69+
self._mh.write(self._log_file, self._log)
70+
except IOError as e:
71+
raise IOError(f'Failed to write log file: {self._log_file}') from e

cascade/base/meta_handler.py

+16-12
Original file line numberDiff line numberDiff line change
@@ -17,15 +17,16 @@
1717
import os
1818
import json
1919
import datetime
20-
from typing import NoReturn, Union, List, Dict, Any
20+
from typing import NoReturn, Union, Dict, Any
2121
from json import JSONEncoder
22+
import deepdiff
2223

2324
import yaml
2425
import numpy as np
2526

26-
from . import Meta
27+
from . import MetaFromFile
2728

28-
supported_meta_formats = ('.json', '.yml')
29+
supported_meta_formats = ('.json', '.yml', '.yaml')
2930

3031

3132
class CustomEncoder(JSONEncoder):
@@ -59,14 +60,17 @@ def default(self, obj: Any) -> Any:
5960
elif isinstance(obj, np.void):
6061
return None
6162

63+
elif isinstance(obj, deepdiff.model.PrettyOrderedSet):
64+
return list(obj)
65+
6266
return super(CustomEncoder, self).default(obj)
6367

64-
def obj_to_dict(self, obj: Any) -> Dict:
68+
def obj_to_dict(self, obj: Any) -> Any:
6569
return json.loads(self.encode(obj))
6670

6771

6872
class BaseHandler:
69-
def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
73+
def read(self, path: str) -> MetaFromFile:
7074
raise NotImplementedError()
7175

7276
def write(self, path: str, obj: Any, overwrite: bool = True) -> None:
@@ -83,7 +87,7 @@ def _raise_io_error(self, path: str, exc: Union[Exception, None] = None) -> NoRe
8387

8488

8589
class JSONHandler(BaseHandler):
86-
def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
90+
def read(self, path: str) -> MetaFromFile:
8791
_, ext = os.path.splitext(path)
8892
if ext == '':
8993
path += '.json'
@@ -97,7 +101,7 @@ def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
97101
self._raise_io_error(path, e)
98102
return meta
99103

100-
def write(self, path: str, obj: List[Dict], overwrite: bool = True) -> None:
104+
def write(self, path: str, obj: Any, overwrite: bool = True) -> None:
101105
if not overwrite and os.path.exists(path):
102106
return
103107

@@ -106,7 +110,7 @@ def write(self, path: str, obj: List[Dict], overwrite: bool = True) -> None:
106110

107111

108112
class YAMLHandler(BaseHandler):
109-
def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
113+
def read(self, path: str) -> MetaFromFile:
110114
_, ext = os.path.splitext(path)
111115
if ext == '':
112116
path += '.yml'
@@ -156,7 +160,7 @@ class MetaHandler:
156160
"""
157161
Encapsulates the logic of reading and writing metadata to disk.
158162
159-
Supported read-write formats are `json` and `yml`. Other formats
163+
Supported read-write formats are `.json` and `.yml` or `.yaml`. Other formats
160164
are supported as read-only. For example one can read meta from txt or md file.
161165
162166
Examples
@@ -168,7 +172,7 @@ class MetaHandler:
168172
>>> mh.write('meta.yml', {'hello': 'world'})
169173
>>> obj = mh.read('meta.yml')
170174
"""
171-
def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
175+
def read(self, path: str) -> MetaFromFile:
172176
"""
173177
Reads object from path.
174178
@@ -179,7 +183,7 @@ def read(self, path: str) -> Union[List[Any], Dict[Any, Any]]:
179183
180184
Returns
181185
-------
182-
obj: Union[List[Any], Dict[Any, Any]]
186+
obj: MetaFromFile
183187
184188
Raises
185189
------
@@ -215,7 +219,7 @@ def _get_handler(self, path: str) -> BaseHandler:
215219
ext = os.path.splitext(path)[-1]
216220
if ext == '.json':
217221
return JSONHandler()
218-
elif ext == '.yml':
222+
elif ext in ('.yml', '.yaml'):
219223
return YAMLHandler()
220224
else:
221225
return TextHandler()

cascade/base/traceable.py

+13-11
Original file line numberDiff line numberDiff line change
@@ -16,9 +16,8 @@
1616

1717

1818
import warnings
19-
from typing import List, Dict, Union, Any
20-
21-
from . import Meta
19+
from typing import Dict, Union, Any
20+
from . import PipeMeta, MetaFromFile
2221

2322

2423
class Traceable:
@@ -29,13 +28,13 @@ class Traceable:
2928
def __init__(
3029
self,
3130
*args: Any,
32-
meta_prefix: Union[Meta, str, None] = None,
31+
meta_prefix: Union[Dict[Any, Any], str, None] = None,
3332
**kwargs: Any
3433
) -> None:
3534
"""
3635
Parameters
3736
----------
38-
meta_prefix: Union[Dict, str], optional
37+
meta_prefix: Union[Dict[Any, Any], str], optional
3938
The dictionary that is used to update object's meta in `get_meta` call.
4039
Due to the call of update can overwrite default values.
4140
If str - prefix assumed to be path and loaded using MetaHandler.
@@ -51,19 +50,22 @@ def __init__(
5150
self._meta_prefix = meta_prefix
5251

5352
@staticmethod
54-
def _read_meta_from_file(path: str) -> Union[List[Any], Dict[Any, Any]]:
53+
def _read_meta_from_file(path: str) -> MetaFromFile:
5554
from . import MetaHandler
5655
return MetaHandler().read(path)
5756

58-
def get_meta(self) -> List[Dict]:
57+
def get_meta(self) -> PipeMeta:
5958
"""
6059
Returns
6160
-------
62-
meta: List[Dict]
63-
A list where last element is this object's metadata.
61+
meta: PipeMeta
62+
A list where first element is this object's metadata.
63+
All other elements represent the other stages of pipeline if present.
64+
6465
Meta can be anything that is worth to document about
6566
the object and its properties.
66-
Meta is list to allow the formation of pipelines.
67+
68+
Meta is a list (see PipeMeta type alias) to allow the formation of pipelines.
6769
"""
6870
meta = {
6971
'name': repr(self)
@@ -74,7 +76,7 @@ def get_meta(self) -> List[Dict]:
7476
self._warn_no_prefix()
7577
return [meta]
7678

77-
def update_meta(self, obj: Union[Dict, str]) -> None:
79+
def update_meta(self, obj: Union[Dict[Any, Any], str]) -> None:
7880
"""
7981
Updates `_meta_prefix`, which then updates
8082
dataset's meta when `get_meta()` is called

cascade/data/apply_modifier.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
limitations under the License.
1515
"""
1616

17-
from typing import Callable, Any, List, Dict
17+
from typing import Callable, Any
1818
from . import Dataset, Modifier, T
1919

2020

@@ -23,7 +23,7 @@ class ApplyModifier(Modifier):
2323
Modifier that maps a function to given dataset's items in a lazy way.
2424
"""
2525
def __init__(self, dataset: Dataset[T], func: Callable[[T], Any],
26-
*args: List[Any], **kwargs: Dict[Any, Any]) -> None:
26+
*args: Any, **kwargs: Any) -> None:
2727
"""
2828
Parameters
2929
----------

cascade/data/composer.py

+3-3
Original file line numberDiff line numberDiff line change
@@ -15,10 +15,10 @@
1515
"""
1616

1717

18-
from typing import List, Tuple, Dict, Any
18+
from typing import List, Tuple, Any
1919

2020
from . import SizedDataset
21-
from ..base import Meta
21+
from ..base import PipeMeta
2222

2323

2424
class Composer(SizedDataset):
@@ -62,7 +62,7 @@ def __getitem__(self, index: int) -> Tuple[Any]:
6262
def __len__(self) -> int:
6363
return self._len
6464

65-
def get_meta(self) -> Meta:
65+
def get_meta(self) -> PipeMeta:
6666
"""
6767
Composer calls `get_meta()` of all its datasets
6868
"""

cascade/data/concatenator.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818

1919
import numpy as np
2020
from .dataset import SizedDataset, T
21-
from ..base import Meta
21+
from ..base import PipeMeta
2222

2323

2424
class Concatenator(SizedDataset):
@@ -71,7 +71,7 @@ def __repr__(self) -> str:
7171
rp = super().__repr__()
7272
return f'{rp} of\n' + '\n'.join(repr(ds) for ds in self._datasets)
7373

74-
def get_meta(self) -> Meta:
74+
def get_meta(self) -> PipeMeta:
7575
"""
7676
Concatenator calls `get_meta()` of all its datasets
7777
"""

0 commit comments

Comments
 (0)