code-loader 1.0.91.dev4__tar.gz → 1.0.91.dev6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32)
  1. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/PKG-INFO +1 -1
  2. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/datasetclasses.py +6 -7
  3. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/inner_leap_binder/leapbinder.py +28 -2
  4. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/inner_leap_binder/leapbinder_decorators.py +26 -14
  5. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/leaploader.py +30 -0
  6. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/leaploaderbase.py +9 -1
  7. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/utils.py +11 -2
  8. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/pyproject.toml +1 -1
  9. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/LICENSE +0 -0
  10. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/README.md +0 -0
  11. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/__init__.py +0 -0
  12. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/__init__.py +0 -0
  13. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/enums.py +0 -0
  14. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/exceptions.py +0 -0
  15. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/mapping.py +0 -0
  16. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/responsedataclasses.py +0 -0
  17. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/contract/visualizer_classes.py +0 -0
  18. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/default_losses.py +0 -0
  19. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/default_metrics.py +0 -0
  20. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/__init__.py +0 -0
  21. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/api.py +0 -0
  22. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/cli_config_utils.py +0 -0
  23. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/client.py +0 -0
  24. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/epoch.py +0 -0
  25. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/experiment.py +0 -0
  26. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/experiment_context.py +0 -0
  27. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/types.py +0 -0
  28. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/utils.py +0 -0
  29. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/experiment_api/workingspace_config_utils.py +0 -0
  30. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/inner_leap_binder/__init__.py +0 -0
  31. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/visualizers/__init__.py +0 -0
  32. {code_loader-1.0.91.dev4 → code_loader-1.0.91.dev6}/code_loader/visualizers/default_visualizers.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: code-loader
3
- Version: 1.0.91.dev4
3
+ Version: 1.0.91.dev6
4
4
  Summary:
5
5
  Home-page: https://github.com/tensorleap/code-loader
6
6
  License: MIT
@@ -39,6 +39,8 @@ class PreprocessResponse:
39
39
  state: Optional[DataStateType] = None
40
40
  sample_id_type: Optional[Union[Type[str], Type[int]]] = None
41
41
  sample_ids_to_instance_mappings: Optional[Dict[Union[str, int], Union[List[str], List[int]]]] = None # in use only for element instance
42
+ instance_to_sample_ids_mappings: Optional[Dict[Union[str, int], Union[List[str], List[int]]]] = None # in use only for element instance
43
+
42
44
 
43
45
  def __post_init__(self) -> None:
44
46
  def is_valid_string(s: str) -> bool:
@@ -68,6 +70,7 @@ class PreprocessResponse:
68
70
 
69
71
 
70
72
  SectionCallableInterface = Callable[[Union[int, str], PreprocessResponse], npt.NDArray[np.float32]]
73
+ InstanceCallableInterface = Callable[[int, PreprocessResponse], List[npt.NDArray[np.float32]]]
71
74
 
72
75
  MetadataSectionCallableInterface = Union[
73
76
  Callable[[Union[int, str], PreprocessResponse], int],
@@ -190,14 +193,9 @@ class InputHandler(DatasetBaseHandler):
190
193
  channel_dim: Optional[int] = -1
191
194
 
192
195
  @dataclass
193
- class ElementInstance:
196
+ class ElementInstanceMasksHandler:
194
197
  name: str
195
- mask: npt.NDArray[np.float32]
196
-
197
- @dataclass
198
- class ElementInstanceHandler:
199
- input_name: str
200
- instance_function: [[int, PreprocessResponse], List[ElementInstance]]
198
+ instance_function: InstanceCallableInterface
201
199
 
202
200
  @dataclass
203
201
  class GroundTruthHandler(DatasetBaseHandler):
@@ -233,6 +231,7 @@ class DatasetIntegrationSetup:
233
231
  unlabeled_data_preprocess: Optional[UnlabeledDataPreprocessHandler] = None
234
232
  visualizers: List[VisualizerHandler] = field(default_factory=list)
235
233
  inputs: List[InputHandler] = field(default_factory=list)
234
+ instance_masks: List[ElementInstanceMasksHandler] = field(default_factory=list)
236
235
  ground_truths: List[GroundTruthHandler] = field(default_factory=list)
237
236
  metadata: List[MetadataHandler] = field(default_factory=list)
238
237
  prediction_types: List[PredictionTypeHandler] = field(default_factory=list)
@@ -10,14 +10,15 @@ from code_loader.contract.datasetclasses import SectionCallableInterface, InputH
10
10
  MetadataSectionCallableInterface, UnlabeledDataPreprocessHandler, CustomLayerHandler, MetricHandler, \
11
11
  CustomCallableInterfaceMultiArgs, ConfusionMatrixCallableInterfaceMultiArgs, LeapData, \
12
12
  CustomMultipleReturnCallableInterfaceMultiArgs, DatasetBaseHandler, custom_latent_space_attribute, \
13
- RawInputsForHeatmap, VisualizerHandlerData, MetricHandlerData, CustomLossHandlerData, SamplePreprocessResponse
13
+ RawInputsForHeatmap, VisualizerHandlerData, MetricHandlerData, CustomLossHandlerData, SamplePreprocessResponse, \
14
+ ElementInstanceMasksHandler, InstanceCallableInterface
14
15
  from code_loader.contract.enums import LeapDataType, DataStateEnum, DataStateType, MetricDirection, DatasetMetadataType
15
16
  from code_loader.contract.mapping import NodeConnection, NodeMapping, NodeMappingType
16
17
  from code_loader.contract.responsedataclasses import DatasetTestResultPayload
17
18
  from code_loader.contract.visualizer_classes import map_leap_data_type_to_visualizer_class
18
19
  from code_loader.default_losses import loss_name_to_function
19
20
  from code_loader.default_metrics import metrics_names_to_functions_and_direction
20
- from code_loader.utils import to_numpy_return_wrapper, get_shape
21
+ from code_loader.utils import to_numpy_return_wrapper, get_shape, to_numpy_return_masks_wrapper
21
22
  from code_loader.visualizers.default_visualizers import DefaultVisualizer, \
22
23
  default_graph_visualizer, \
23
24
  default_image_visualizer, default_horizontal_bar_visualizer, default_word_visualizer, \
@@ -234,6 +235,31 @@ class LeapBinder:
234
235
 
235
236
  self._encoder_names.append(name)
236
237
 
238
+
239
+ def set_instance_masks(self, function: InstanceCallableInterface, name: str) -> None:
240
+ """
241
+ Set the input handler function.
242
+
243
+ Args:
244
+ function (SectionCallableInterface): The input handler function.
245
+ name (str): The name of the input section.
246
+ channel_dim (int): The dimension of the channels axis
247
+
248
+ Example:
249
+ def input_encoder(subset: PreprocessResponse, index: int) -> np.ndarray:
250
+ # Return the processed input data for the given index and given subset response
251
+ img_path = subset.`data["images"][idx]
252
+ img = read_img(img_path)
253
+ img = normalize(img)
254
+ return img
255
+
256
+ leap_binder.set_input(input_encoder, name='input_encoder', channel_dim=-1)
257
+ """
258
+ function = to_numpy_return_masks_wrapper(function)
259
+ self.setup_container.instance_masks.append(ElementInstanceMasksHandler(name, function))
260
+
261
+ self._encoder_names.append(name)
262
+
237
263
  def add_custom_loss(self, function: CustomCallableInterface, name: str) -> None:
238
264
  """
239
265
  Add a custom loss function to the setup.
@@ -8,7 +8,7 @@ import numpy.typing as npt
8
8
  from code_loader.contract.datasetclasses import CustomCallableInterfaceMultiArgs, \
9
9
  CustomMultipleReturnCallableInterfaceMultiArgs, ConfusionMatrixCallableInterfaceMultiArgs, CustomCallableInterface, \
10
10
  VisualizerCallableInterface, MetadataSectionCallableInterface, PreprocessResponse, SectionCallableInterface, \
11
- ConfusionMatrixElement, SamplePreprocessResponse
11
+ ConfusionMatrixElement, SamplePreprocessResponse, InstanceCallableInterface
12
12
  from code_loader.contract.enums import MetricDirection, LeapDataType, DatasetMetadataType
13
13
  from code_loader import leap_binder
14
14
  from code_loader.contract.mapping import NodeMapping, NodeMappingType, NodeConnection
@@ -276,14 +276,19 @@ def tensorleap_element_instance_preprocess(instance_mask_encoder: Callable[[int,
276
276
  result = user_function()
277
277
  for preprocess_response in result:
278
278
  sample_ids_to_instance_mappings = {}
279
+ instance_to_sample_ids_mappings = {}
279
280
  all_sample_ids = preprocess_response.sample_ids.copy()
280
281
  for sample_id in preprocess_response.sample_ids:
281
282
  data_length = len(all_sample_ids)
282
283
  instances_masks = instance_mask_encoder(sample_id, preprocess_response)
283
284
  instances_ids = list(range(data_length, data_length + len(instances_masks)))
284
285
  sample_ids_to_instance_mappings[sample_id] = instances_ids
286
+ instance_to_sample_ids_mappings[sample_id] = sample_id
287
+ for instance_id in instances_ids:
288
+ instance_to_sample_ids_mappings[instance_id] = sample_id
285
289
  all_sample_ids.extend(instances_ids)
286
290
  preprocess_response.sample_ids_to_instance_mappings = sample_ids_to_instance_mappings
291
+ preprocess_response.instance_to_sample_ids_mappings = instance_to_sample_ids_mappings
287
292
  preprocess_response.sample_ids = all_sample_ids
288
293
  return result
289
294
 
@@ -342,23 +347,30 @@ def tensorleap_unlabeled_preprocess():
342
347
  return decorating_function
343
348
 
344
349
 
345
- def tensorleap_instance_encoder():
346
- def decorating_function(user_function: Callable[[], PreprocessResponse]):
347
- leap_binder.set_unlabeled_data_preprocess(user_function)
350
+ def tensorleap_instances_masks_encoder(name: str, model_input_index=None):
351
+ def decorating_function(user_function: InstanceCallableInterface):
352
+ leap_binder.set_instance_masks(user_function, name)
348
353
 
349
- def _validate_input_args(*args, **kwargs):
350
- assert len(args) == 0 and len(kwargs) == 0, \
351
- (f'tensorleap_instance_encoder validation failed: '
352
- f'The function should not take any arguments. Got {args} and {kwargs}.')
354
+ def _validate_input_args(sample_id: Union[int, str], preprocess_response: PreprocessResponse):
355
+ assert isinstance(sample_id, (int, str)), \
356
+ (f'tensorleap_input_encoder validation failed: '
357
+ f'Argument sample_id should be either int or str. Got {type(sample_id)}.')
358
+ assert isinstance(preprocess_response, PreprocessResponse), \
359
+ (f'tensorleap_input_encoder validation failed: '
360
+ f'Argument preprocess_response should be a PreprocessResponse. Got {type(preprocess_response)}.')
361
+ assert type(sample_id) == preprocess_response.sample_id_type, \
362
+ (f'tensorleap_input_encoder validation failed: '
363
+ f'Argument sample_id should be as the same type as defined in the preprocess response '
364
+ f'{preprocess_response.sample_id_type}. Got {type(sample_id)}.')
353
365
 
354
366
  def _validate_result(result):
355
- assert isinstance(result, PreprocessResponse), \
356
- (f'tensorleap_instance_encoder validation failed: '
357
- f'The return type should be a PreprocessResponse. Got {type(result)}.')
367
+ assert isinstance(result, list), \
368
+ (f'tensorleap_input_encoder validation failed: '
369
+ f'Unsupported return type. Should be a numpy array. Got {type(result)}.')
358
370
 
359
- def inner(*args, **kwargs):
360
- _validate_input_args(*args, **kwargs)
361
- result = user_function()
371
+ def inner(sample_id, preprocess_response):
372
+ _validate_input_args(sample_id, preprocess_response)
373
+ result = user_function(sample_id, preprocess_response)
362
374
  _validate_result(result)
363
375
  return result
364
376
 
@@ -150,6 +150,21 @@ class LeapLoader(LeapLoaderBase):
150
150
  state=state)
151
151
  return sample
152
152
 
153
+ def get_sample_masks(self, state: DataStateEnum, sample_id: Union[int, str]) -> List[DatasetSample]:
154
+ self.exec_script()
155
+ preprocess_result = self._preprocess_result()
156
+ if state == DataStateEnum.unlabeled and sample_id not in preprocess_result[state].sample_ids:
157
+ self._preprocess_result(update_unlabeled_preprocess=True)
158
+
159
+ metadata, metadata_is_none = self._get_metadata(state, sample_id)
160
+ sample = DatasetSample(inputs=self._get_inputs(state, sample_id),
161
+ gt=None if state == DataStateEnum.unlabeled else self._get_gt(state, sample_id),
162
+ metadata=metadata,
163
+ metadata_is_none=metadata_is_none,
164
+ index=sample_id,
165
+ state=state)
166
+ return sample
167
+
153
168
  def check_dataset(self) -> DatasetIntegParseResult:
154
169
  test_payloads: List[DatasetTestResultPayload] = []
155
170
  setup_response = None
@@ -505,3 +520,18 @@ class LeapLoader(LeapLoaderBase):
505
520
  raise Exception("Different id types in preprocess results")
506
521
 
507
522
  return id_type
523
+
524
+ def get_instances_data(self, state: DataStateEnum) -> Tuple[Dict[Union[int, str], List[Union[int, str]]], Dict[Union[int, str], List[Union[int, str]]], List[Union[int, str]]]:
525
+ """
526
+ This Method get the data state and returns two dictionaries that holds the mapping of the sample ids to their
527
+ instances and the other way around and the sample ids array.
528
+ Args:
529
+ state: DataStateEnum state
530
+ Returns:
531
+ sample_ids_to_instance_mappings: sample id to instance mappings
532
+ instance_to_sample_ids_mappings: instance to sample ids mappings
533
+ sample_ids: sample ids array
534
+ """
535
+ preprocess_result = self._preprocess_result()
536
+ preprocess_state = preprocess_result[state]
537
+ return preprocess_state.sample_ids_to_instance_mappings, preprocess_state.instance_to_sample_ids_mappings, preprocess_state.sample_ids
@@ -2,7 +2,7 @@
2
2
 
3
3
  from abc import abstractmethod
4
4
 
5
- from typing import Dict, List, Union, Type, Optional
5
+ from typing import Dict, List, Union, Type, Optional, Tuple
6
6
 
7
7
  import numpy as np
8
8
  import numpy.typing as npt
@@ -64,6 +64,14 @@ class LeapLoaderBase:
64
64
  def get_sample(self, state: DataStateEnum, sample_id: Union[int, str]) -> DatasetSample:
65
65
  pass
66
66
 
67
+ @abstractmethod
68
+ def get_instances_data(self, state: DataStateEnum) -> Tuple[Dict[Union[int, str], List[Union[int, str]]], Dict[Union[int, str], List[Union[int, str]]], List[Union[int, str]]]:
69
+ pass
70
+
71
+ @abstractmethod
72
+ def get_sample_masks(self, state: DataStateEnum, sample_id: Union[int, str]) -> List[DatasetSample]:
73
+ pass
74
+
67
75
  @abstractmethod
68
76
  def check_dataset(self) -> DatasetIntegParseResult:
69
77
  pass
@@ -1,12 +1,13 @@
1
1
  import sys
2
2
  from pathlib import Path
3
3
  from types import TracebackType
4
- from typing import List, Union, Tuple, Any
4
+ from typing import List, Union, Tuple, Any, Callable
5
5
  import traceback
6
6
  import numpy as np
7
7
  import numpy.typing as npt
8
8
 
9
- from code_loader.contract.datasetclasses import SectionCallableInterface, PreprocessResponse
9
+ from code_loader.contract.datasetclasses import SectionCallableInterface, PreprocessResponse, \
10
+ InstanceCallableInterface
10
11
 
11
12
 
12
13
  def to_numpy_return_wrapper(encoder_function: SectionCallableInterface) -> SectionCallableInterface:
@@ -17,6 +18,14 @@ def to_numpy_return_wrapper(encoder_function: SectionCallableInterface) -> Secti
17
18
 
18
19
  return numpy_encoder_function
19
20
 
21
+ def to_numpy_return_masks_wrapper(encoder_function: InstanceCallableInterface) -> Callable[
22
+ [Union[int, str], PreprocessResponse], List[npt.NDArray[np.float32]]]:
23
+ def numpy_encoder_function(idx: Union[int, str], samples: PreprocessResponse) -> List[npt.NDArray[np.float32]]:
24
+ result = encoder_function(idx, samples)
25
+ numpy_result: List[npt.NDArray[np.float32]] = [np.array(res) for res in result]
26
+ return numpy_result
27
+ return numpy_encoder_function
28
+
20
29
 
21
30
  def get_root_traceback(exc_tb: TracebackType) -> TracebackType:
22
31
  return_traceback = exc_tb
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "code-loader"
3
- version = "1.0.91.dev4"
3
+ version = "1.0.91.dev6"
4
4
  description = ""
5
5
  authors = ["dorhar <doron.harnoy@tensorleap.ai>"]
6
6
  license = "MIT"