PyPI - tf-models-nightly - Versions diffs - 2.11.0.dev20230320__py2.py3-none-any.whl → 2.11.0.dev20230322__py2.py3-none-any.whl - Mend

tf-models-nightly 2.11.0.dev20230320__py2.py3-none-any.whl → 2.11.0.dev20230322__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

official/projects/yt8m/tasks/yt8m_task.py CHANGED Viewed

@@ -43,25 +43,13 @@ class YT8MTask(base_task.Task):
     logging.info('Build model input %r', common_input_shape)
     l2_weight_decay = self.task_config.losses.l2_weight_decay
-    # Divide weight decay by 2.0 to match the implementation of tf.nn.l2_loss.
-    # (https://www.tensorflow.org/api_docs/python/tf/keras/regularizers/l2)
-    # (https://www.tensorflow.org/api_docs/python/tf/nn/l2_loss)
-    l2_regularizer = (
-        tf.keras.regularizers.l2(l2_weight_decay /
-                                 2.0) if l2_weight_decay else None)
     # Model configuration.
     model_config = self.task_config.model
-    norm_activation_config = model_config.norm_activation
     model = DbofModel(
         params=model_config,
         input_specs=input_specs,
-        num_frames=train_cfg.num_frames,
         num_classes=train_cfg.num_classes,
-        activation=norm_activation_config.activation,
-        use_sync_bn=norm_activation_config.use_sync_bn,
-        norm_momentum=norm_activation_config.norm_momentum,
-        norm_epsilon=norm_activation_config.norm_epsilon,
-        kernel_regularizer=l2_regularizer)
+        l2_weight_decay=l2_weight_decay)
     non_trainable_batch_norm_variables = []
     non_trainable_extra_variables = []
@@ -73,18 +61,32 @@ class YT8MTask(base_task.Task):
           non_trainable_extra_variables.append(var)
     logging.info(
-        'Trainable model variables:\n%s', '\n'.join(
-            [f'{var.name}\t{var.shape}' for var in model.trainable_variables]))
+        'Trainable model variables:\n%s',
+        '\n'.join(
+            [f'{var.name}\t{var.shape}' for var in model.trainable_variables]
+        ),
+    )
     logging.info(
-        'Non-trainable batch norm variables (get updated in training mode):\n%s',
-        '\n'.join([
-            f'{var.name}\t{var.shape}'
-            for var in non_trainable_batch_norm_variables
-        ]))
+        (
+            'Non-trainable batch norm variables (get updated in training'
+            ' mode):\n%s'
+        ),
+        '\n'.join(
+            [
+                f'{var.name}\t{var.shape}'
+                for var in non_trainable_batch_norm_variables
+            ]
+        ),
+    )
     logging.info(
-        'Non-trainable frozen model variables:\n%s', '\n'.join([
-            f'{var.name}\t{var.shape}' for var in non_trainable_extra_variables
-        ]))
+        'Non-trainable frozen model variables:\n%s',
+        '\n'.join(
+            [
+                f'{var.name}\t{var.shape}'
+                for var in non_trainable_extra_variables
+            ]
+        ),
+    )
     return model
   def build_inputs(self, params: yt8m_cfg.DataConfig, input_context=None):
@@ -180,7 +182,10 @@ class YT8MTask(base_task.Task):
     for name in metric_names:
       metrics.append(tf.keras.metrics.Mean(name, dtype=tf.float32))
-    if self.task_config.evaluation.average_precision is not None and not training:
+    if (
+        self.task_config.evaluation.average_precision is not None
+        and not training
+    ):
       # Cannot run in train step.
       num_classes = self.task_config.validation_data.num_classes
       top_k = self.task_config.evaluation.average_precision.top_k
@@ -190,14 +195,16 @@ class YT8MTask(base_task.Task):
     return metrics
-  def process_metrics(self,
-                      metrics: List[tf.keras.metrics.Metric],
-                      labels: tf.Tensor,
-                      outputs: tf.Tensor,
-                      model_losses: Optional[Dict[str, tf.Tensor]] = None,
-                      label_weights: Optional[tf.Tensor] = None,
-                      training: bool = True,
-                      **kwargs) -> Dict[str, Tuple[tf.Tensor, ...]]:
+  def process_metrics(
+      self,
+      metrics: List[tf.keras.metrics.Metric],
+      labels: tf.Tensor,
+      outputs: tf.Tensor,
+      model_losses: Optional[Dict[str, tf.Tensor]] = None,
+      label_weights: Optional[tf.Tensor] = None,
+      training: bool = True,
+      **kwargs,
+  ) -> Dict[str, Tuple[tf.Tensor, ...]]:
     """Updates metrics.
     Args:
@@ -217,7 +224,10 @@ class YT8MTask(base_task.Task):
       model_losses = {}
     logs = {}
-    if self.task_config.evaluation.average_precision is not None and not training:
+    if (
+        self.task_config.evaluation.average_precision is not None
+        and not training
+    ):
       logs.update({self.avg_prec_metric.name: (labels, outputs)})
     for m in metrics:
@@ -240,12 +250,13 @@ class YT8MTask(base_task.Task):
     # sample random frames / random sequence.
     num_frames = tf.cast(num_frames, tf.float32)
-    sample_frames = data_config.num_frames
+    num_sample_frames = data_config.num_sample_frames
     if self.task_config.model.sample_random_frames:
-      features = utils.sample_random_frames(features, num_frames, sample_frames)
+      features = utils.sample_random_frames(
+          features, num_frames, num_sample_frames)
     else:
-      features = utils.sample_random_sequence(features, num_frames,
-                                              sample_frames)
+      features = utils.sample_random_sequence(
+          features, num_frames, num_sample_frames)
     return features
   def _preprocess_labels(self,

official/vision/dataloaders/maskrcnn_input.py CHANGED Viewed

@@ -211,19 +211,18 @@ class Parser(parser.Parser):
     image = preprocess_ops.normalize_image(image)
     # Flips image randomly during training.
-    if self._aug_rand_hflip:
-      if self._include_mask:
-        image, boxes, masks = preprocess_ops.random_horizontal_flip(
-            image, boxes, masks)
-      else:
-        image, boxes, _ = preprocess_ops.random_horizontal_flip(
-            image, boxes)
-    if self._aug_rand_vflip:
-      if self._include_mask:
-        image, boxes, masks = preprocess_ops.random_vertical_flip(
-            image, boxes, masks)
-      else:
-        image, boxes, _ = preprocess_ops.random_vertical_flip(image, boxes)
+    image, boxes, masks = preprocess_ops.random_horizontal_flip(
+        image,
+        boxes,
+        masks=None if not self._include_mask else masks,
+        prob=tf.where(self._aug_rand_hflip, 0.5, 0.0),
+    )
+    image, boxes, masks = preprocess_ops.random_vertical_flip(
+        image,
+        boxes,
+        masks=None if not self._include_mask else masks,
+        prob=tf.where(self._aug_rand_vflip, 0.5, 0.0),
+    )
     # Converts boxes from normalized coordinates to pixel coordinates.
     # Now the coordinates of boxes are w.r.t. the original image.

official/vision/dataloaders/tfds_classification_decoders.py CHANGED Viewed

@@ -35,4 +35,5 @@ TFDS_ID_TO_DECODER_MAP = {
     'cifar10': ClassificationDecorder,
     'cifar100': ClassificationDecorder,
     'imagenet2012': ClassificationDecorder,
+    'imagenet2012_fewshot/10shot': ClassificationDecorder,
 }

official/vision/evaluation/instance_metrics.py CHANGED Viewed

@@ -465,213 +465,6 @@ def _count_detection_type(
   return count
-def _compute_fp_tp_gt_count(
-    y_true: Dict[str, tf.Tensor],
-    y_pred: Dict[str, tf.Tensor],
-    num_classes: int,
-    mask_output_boundary: Tuple[int, int] = (640, 640),
-    iou_thresholds: Tuple[float, ...] = (0.5,),
-    matching_algorithm: Optional[MatchingAlgorithm] = None,
-    num_confidence_bins: int = 1000,
-    use_masks: bool = False,
-) -> Tuple[tf.Tensor, tf.Tensor, tf.Tensor]:
-  """Computes the true and false positives."""
-  if matching_algorithm is None:
-    matching_algorithm = COCOMatchingAlgorithm(iou_thresholds)
-  # (batch_size, num_detections, 4) in absolute coordinates.
-  detection_boxes = tf.cast(y_pred['detection_boxes'], tf.float32)
-  # (batch_size, num_detections)
-  detection_classes = tf.cast(y_pred['detection_classes'], tf.int32)
-  # (batch_size, num_detections)
-  detection_scores = tf.cast(y_pred['detection_scores'], tf.float32)
-  # (batch_size, num_gts, 4) in absolute coordinates.
-  gt_boxes = tf.cast(y_true['boxes'], tf.float32)
-  # (batch_size, num_gts)
-  gt_classes = tf.cast(y_true['classes'], tf.int32)
-  # (batch_size, num_gts)
-  if 'is_crowds' in y_true:
-    gt_is_crowd = tf.cast(y_true['is_crowds'], tf.bool)
-  else:
-    gt_is_crowd = tf.zeros_like(gt_classes, dtype=tf.bool)
-  image_scale = tf.tile(y_true['image_info'][:, 2:3, :], multiples=[1, 1, 2])
-  detection_boxes = detection_boxes / tf.cast(
-      image_scale, dtype=detection_boxes.dtype
-  )
-  # Step 1: Computes IoUs between the detections and the non-crowd ground
-  # truths and IoAs between the detections and the crowd ground truths.
-  if not use_masks:
-    # (batch_size, num_detections, num_gts)
-    detection_to_gt_ious = box_ops.bbox_overlap(detection_boxes, gt_boxes)
-    detection_to_gt_ioas = box_ops.bbox_intersection_over_area(
-        detection_boxes, gt_boxes
-    )
-  else:
-    # (batch_size, num_detections, mask_height, mask_width)
-    detection_masks = tf.cast(y_pred['detection_masks'], tf.float32)
-    # (batch_size, num_gts, gt_mask_height, gt_mask_width)
-    gt_masks = tf.cast(y_true['masks'], tf.float32)
-    num_detections = detection_boxes.get_shape()[1]
-    # (batch_size, num_detections + num_gts, 4)
-    all_boxes = _shift_and_rescale_boxes(
-        tf.concat([detection_boxes, gt_boxes], axis=1),
-        mask_output_boundary,
-    )
-    detection_boxes = all_boxes[:, :num_detections, :]
-    gt_boxes = all_boxes[:, num_detections:, :]
-    # (batch_size, num_detections, num_gts)
-    detection_to_gt_ious, detection_to_gt_ioas = (
-        mask_ops.instance_masks_overlap(
-            detection_boxes,
-            detection_masks,
-            gt_boxes,
-            gt_masks,
-            output_size=mask_output_boundary,
-        )
-    )
-  # (batch_size, num_detections, num_gts)
-  detection_to_gt_ious = tf.where(
-      gt_is_crowd[:, tf.newaxis, :], 0.0, detection_to_gt_ious
-  )
-  detection_to_crowd_ioas = tf.where(
-      gt_is_crowd[:, tf.newaxis, :], detection_to_gt_ioas, 0.0
-  )
-  # Step 2: counts true positives grouped by IoU thresholds, classes and
-  # confidence bins.
-  # (batch_size, num_detections, num_iou_thresholds)
-  detection_is_tp, _ = matching_algorithm(
-      detection_to_gt_ious, detection_classes, detection_scores, gt_classes
-  )
-  # (batch_size * num_detections,)
-  flattened_binned_confidence = tf.reshape(
-      tf.cast(detection_scores * num_confidence_bins, tf.int32), [-1]
-  )
-  # (batch_size * num_detections, num_confidence_bins + 1)
-  flattened_binned_confidence_one_hot = tf.one_hot(
-      flattened_binned_confidence, num_confidence_bins + 1, axis=1
-  )
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  tp_count = _count_detection_type(
-      detection_is_tp,
-      detection_classes,
-      flattened_binned_confidence_one_hot,
-      num_classes,
-  )
-  # Step 3: Counts false positives grouped by IoU thresholds, classes and
-  # confidence bins.
-  # False positive: detection is not true positive (see above) and not part of
-  # the crowd ground truth with the same class.
-  # (batch_size, num_detections, num_gts, num_iou_thresholds)
-  detection_matches_crowd = (
-      (detection_to_crowd_ioas[..., tf.newaxis] > iou_thresholds)
-      & (
-          detection_classes[:, :, tf.newaxis, tf.newaxis]
-          == gt_classes[:, tf.newaxis, :, tf.newaxis]
-      )
-      & (detection_classes[:, :, tf.newaxis, tf.newaxis] > 0)
-  )
-  # (batch_size, num_detections, num_iou_thresholds)
-  detection_matches_any_crowd = tf.reduce_any(
-      detection_matches_crowd & ~detection_is_tp[:, :, tf.newaxis, :], axis=2
-  )
-  detection_is_fp = ~detection_is_tp & ~detection_matches_any_crowd
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  fp_count = _count_detection_type(
-      detection_is_fp,
-      detection_classes,
-      flattened_binned_confidence_one_hot,
-      num_classes,
-  )
-  # Step 4: Counts non-crowd groundtruths grouped by classes.
-  # (num_classes, )
-  gt_count = tf.reduce_sum(
-      tf.one_hot(
-          tf.where(gt_is_crowd, -1, gt_classes), num_classes, axis=-1
-      ),
-      axis=[0, 1],
-  )
-  # Clears the count of class 0 (background).
-  gt_count *= 1.0 - tf.eye(1, num_classes, dtype=gt_count.dtype)[0]
-  return tp_count, fp_count, gt_count
-def _compute_metrics(
-    tp_count: tf.Tensor,
-    fp_count: tf.Tensor,
-    gt_count: tf.Tensor,
-    confidence_thresholds: Tuple[float, ...] = (),
-    num_confidence_bins: int = 1000,
-    average_precision_algorithms: Optional[
-        Dict[str, AveragePrecision]] = None,
-) -> Dict[str, tf.Tensor]:
-  """Returns the metrics values as a dict."""
-  if average_precision_algorithms is None:
-    average_precision_algorithms = {'ap': COCOAveragePrecision()}
-  result = {
-      # (num_classes,)
-      'valid_classes': gt_count != 0,
-  }
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  tp_count_cum_by_confidence = tf.math.cumsum(
-      tp_count, axis=-1, reverse=True
-  )
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  fp_count_cum_by_confidence = tf.math.cumsum(
-      fp_count, axis=-1, reverse=True
-  )
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  precisions = tf.math.divide_no_nan(
-      tp_count_cum_by_confidence,
-      tp_count_cum_by_confidence + fp_count_cum_by_confidence,
-  )
-  # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
-  recalls = tf.math.divide_no_nan(
-      tp_count_cum_by_confidence, gt_count[..., tf.newaxis]
-  )
-  if confidence_thresholds:
-    # If confidence_thresholds is set, reports precision and recall at each
-    # confidence threshold.
-    confidence_thresholds = tf.cast(
-        tf.constant(confidence_thresholds, dtype=tf.float32)
-        * num_confidence_bins,
-        dtype=tf.int32,
-    )
-    # (num_confidence_thresholds, num_iou_thresholds, num_classes)
-    result['precisions'] = tf.gather(
-        tf.transpose(precisions, [2, 0, 1]), confidence_thresholds
-    )
-    result['recalls'] = tf.gather(
-        tf.transpose(recalls, [2, 0, 1]), confidence_thresholds
-    )
-  precisions = tf.reverse(precisions, axis=[-1])
-  recalls = tf.reverse(recalls, axis=[-1])
-  result.update(
-      {
-          # (num_iou_thresholds, num_classes)
-          key: ap_algorithm(precisions, recalls)
-          for key, ap_algorithm in average_precision_algorithms.items()
-      }
-  )
-  return result
 class InstanceMetrics(tf.keras.metrics.Metric):
   """Reports the metrics of instance detection & segmentation."""
@@ -780,22 +573,138 @@ class InstanceMetrics(tf.keras.metrics.Metric):
   def reset_state(self):
     """Resets all of the metric state variables."""
-    for v in self.variables:
-      tf.keras.backend.set_value(v, np.zeros(v.shape))
+    self.tp_count.assign(tf.zeros_like(self.tp_count))
+    self.fp_count.assign(tf.zeros_like(self.fp_count))
+    self.gt_count.assign(tf.zeros_like(self.gt_count))
   def update_state(
       self, y_true: Dict[str, tf.Tensor], y_pred: Dict[str, tf.Tensor]
   ):
+    # (batch_size, num_detections, 4) in absolute coordinates.
+    detection_boxes = tf.cast(y_pred['detection_boxes'], tf.float32)
+    # (batch_size, num_detections)
+    detection_classes = tf.cast(y_pred['detection_classes'], tf.int32)
+    # (batch_size, num_detections)
+    detection_scores = tf.cast(y_pred['detection_scores'], tf.float32)
+    # (batch_size, num_gts, 4) in absolute coordinates.
+    gt_boxes = tf.cast(y_true['boxes'], tf.float32)
+    # (batch_size, num_gts)
+    gt_classes = tf.cast(y_true['classes'], tf.int32)
+    # (batch_size, num_gts)
+    if 'is_crowds' in y_true:
+      gt_is_crowd = tf.cast(y_true['is_crowds'], tf.bool)
+    else:
+      gt_is_crowd = tf.zeros_like(gt_classes, dtype=tf.bool)
-    tp_count, fp_count, gt_count = _compute_fp_tp_gt_count(
-        y_true=y_true,
-        y_pred=y_pred,
-        num_classes=self._num_classes,
-        mask_output_boundary=self._mask_output_boundary,
-        iou_thresholds=self._iou_thresholds,
-        matching_algorithm=self._matching_algorithm,
-        num_confidence_bins=self._num_confidence_bins,
-        use_masks=self._use_masks)
+    image_scale = tf.tile(y_true['image_info'][:, 2:3, :], multiples=[1, 1, 2])
+    detection_boxes = detection_boxes / tf.cast(
+        image_scale, dtype=detection_boxes.dtype
+    )
+    # Step 1: Computes IoUs between the detections and the non-crowd ground
+    # truths and IoAs between the detections and the crowd ground truths.
+    if not self._use_masks:
+      # (batch_size, num_detections, num_gts)
+      detection_to_gt_ious = box_ops.bbox_overlap(detection_boxes, gt_boxes)
+      detection_to_gt_ioas = box_ops.bbox_intersection_over_area(
+          detection_boxes, gt_boxes
+      )
+    else:
+      # Use outer boxes to generate the masks if available.
+      if 'detection_outer_boxes' in y_pred:
+        detection_boxes = tf.cast(y_pred['detection_outer_boxes'], tf.float32)
+      # (batch_size, num_detections, mask_height, mask_width)
+      detection_masks = tf.cast(y_pred['detection_masks'], tf.float32)
+      # (batch_size, num_gts, gt_mask_height, gt_mask_width)
+      gt_masks = tf.cast(y_true['masks'], tf.float32)
+      num_detections = detection_boxes.get_shape()[1]
+      # (batch_size, num_detections + num_gts, 4)
+      all_boxes = _shift_and_rescale_boxes(
+          tf.concat([detection_boxes, gt_boxes], axis=1),
+          self._mask_output_boundary,
+      )
+      detection_boxes = all_boxes[:, :num_detections, :]
+      gt_boxes = all_boxes[:, num_detections:, :]
+      # (batch_size, num_detections, num_gts)
+      detection_to_gt_ious, detection_to_gt_ioas = (
+          mask_ops.instance_masks_overlap(
+              detection_boxes,
+              detection_masks,
+              gt_boxes,
+              gt_masks,
+              output_size=self._mask_output_boundary,
+          )
+      )
+    # (batch_size, num_detections, num_gts)
+    detection_to_gt_ious = tf.where(
+        gt_is_crowd[:, tf.newaxis, :], 0.0, detection_to_gt_ious
+    )
+    detection_to_crowd_ioas = tf.where(
+        gt_is_crowd[:, tf.newaxis, :], detection_to_gt_ioas, 0.0
+    )
+    # Step 2: counts true positives grouped by IoU thresholds, classes and
+    # confidence bins.
+    # (batch_size, num_detections, num_iou_thresholds)
+    detection_is_tp, _ = self._matching_algorithm(
+        detection_to_gt_ious, detection_classes, detection_scores, gt_classes
+    )
+    # (batch_size * num_detections,)
+    flattened_binned_confidence = tf.reshape(
+        tf.cast(detection_scores * self._num_confidence_bins, tf.int32), [-1]
+    )
+    # (batch_size * num_detections, num_confidence_bins + 1)
+    flattened_binned_confidence_one_hot = tf.one_hot(
+        flattened_binned_confidence, self._num_confidence_bins + 1, axis=1
+    )
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    tp_count = _count_detection_type(
+        detection_is_tp,
+        detection_classes,
+        flattened_binned_confidence_one_hot,
+        self._num_classes,
+    )
+    # Step 3: Counts false positives grouped by IoU thresholds, classes and
+    # confidence bins.
+    # False positive: detection is not true positive (see above) and not part of
+    # the crowd ground truth with the same class.
+    # (batch_size, num_detections, num_gts, num_iou_thresholds)
+    detection_matches_crowd = (
+        (detection_to_crowd_ioas[..., tf.newaxis] > self._iou_thresholds)
+        & (
+            detection_classes[:, :, tf.newaxis, tf.newaxis]
+            == gt_classes[:, tf.newaxis, :, tf.newaxis]
+        )
+        & (detection_classes[:, :, tf.newaxis, tf.newaxis] > 0)
+    )
+    # (batch_size, num_detections, num_iou_thresholds)
+    detection_matches_any_crowd = tf.reduce_any(
+        detection_matches_crowd & ~detection_is_tp[:, :, tf.newaxis, :], axis=2
+    )
+    detection_is_fp = ~detection_is_tp & ~detection_matches_any_crowd
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    fp_count = _count_detection_type(
+        detection_is_fp,
+        detection_classes,
+        flattened_binned_confidence_one_hot,
+        self._num_classes,
+    )
+    # Step 4: Counts non-crowd groundtruths grouped by classes.
+    # (num_classes, )
+    gt_count = tf.reduce_sum(
+        tf.one_hot(
+            tf.where(gt_is_crowd, -1, gt_classes), self._num_classes, axis=-1
+        ),
+        axis=[0, 1],
+    )
+    # Clears the count of class 0 (background).
+    gt_count *= 1.0 - tf.eye(1, self._num_classes, dtype=gt_count.dtype)[0]
     # Accumulates the variables.
     self.fp_count.assign_add(tf.cast(fp_count, self.fp_count.dtype))
@@ -818,13 +727,55 @@ class InstanceMetrics(tf.keras.metrics.Metric):
         'valid_classes': a bool tensor in shape (num_classes,). If False, there
         is no instance of the class in the ground truth.
     """
-    result = _compute_metrics(
-        fp_count=self.fp_count,
-        tp_count=self.tp_count,
-        gt_count=self.gt_count,
-        confidence_thresholds=self._confidence_thresholds,
-        num_confidence_bins=self._num_confidence_bins,
-        average_precision_algorithms=self._average_precision_algorithms)
+    result = {
+        # (num_classes,)
+        'valid_classes': self.gt_count != 0,
+    }
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    tp_count_cum_by_confidence = tf.math.cumsum(
+        self.tp_count, axis=-1, reverse=True
+    )
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    fp_count_cum_by_confidence = tf.math.cumsum(
+        self.fp_count, axis=-1, reverse=True
+    )
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    precisions = tf.math.divide_no_nan(
+        tp_count_cum_by_confidence,
+        tp_count_cum_by_confidence + fp_count_cum_by_confidence,
+    )
+    # (num_iou_thresholds, num_classes, num_confidence_bins + 1)
+    recalls = tf.math.divide_no_nan(
+        tp_count_cum_by_confidence, self.gt_count[..., tf.newaxis]
+    )
+    if self._confidence_thresholds:
+      # If confidence_thresholds is set, reports precision and recall at each
+      # confidence threshold.
+      confidence_thresholds = tf.cast(
+          tf.constant(self._confidence_thresholds, dtype=tf.float32)
+          * self._num_confidence_bins,
+          dtype=tf.int32,
+      )
+      # (num_confidence_thresholds, num_iou_thresholds, num_classes)
+      result['precisions'] = tf.gather(
+          tf.transpose(precisions, [2, 0, 1]), confidence_thresholds
+      )
+      result['recalls'] = tf.gather(
+          tf.transpose(recalls, [2, 0, 1]), confidence_thresholds
+      )
+    precisions = tf.reverse(precisions, axis=[-1])
+    recalls = tf.reverse(recalls, axis=[-1])
+    result.update(
+        {
+            # (num_iou_thresholds, num_classes)
+            key: ap_algorithm(precisions, recalls)
+            for key, ap_algorithm in self._average_precision_algorithms.items()
+        }
+    )
     return result
   def get_average_precision_metrics_keys(self):

official/vision/ops/preprocess_ops.py CHANGED Viewed

@@ -182,7 +182,12 @@ def resize_and_crop_image(image,
   with tf.name_scope('resize_and_crop_image'):
     image_size = tf.cast(tf.shape(image)[0:2], tf.float32)
-    random_jittering = (aug_scale_min != 1.0 or aug_scale_max != 1.0)
+    random_jittering = (
+        isinstance(aug_scale_min, tf.Tensor)
+        or isinstance(aug_scale_max, tf.Tensor)
+        or not math.isclose(aug_scale_min, 1.0)
+        or not math.isclose(aug_scale_max, 1.0)
+    )
     if random_jittering:
       random_scale = tf.random.uniform(
@@ -292,7 +297,12 @@ def resize_and_crop_image_v2(image,
         scaled_size)
     desired_size = scaled_size
-    random_jittering = (aug_scale_min != 1.0 or aug_scale_max != 1.0)
+    random_jittering = (
+        isinstance(aug_scale_min, tf.Tensor)
+        or isinstance(aug_scale_max, tf.Tensor)
+        or not math.isclose(aug_scale_min, 1.0)
+        or not math.isclose(aug_scale_max, 1.0)
+    )
     if random_jittering:
       random_scale = tf.random.uniform(
@@ -641,10 +651,12 @@ def horizontal_flip_masks(masks):
   return masks[:, :, ::-1]
-def random_horizontal_flip(image, normalized_boxes=None, masks=None, seed=1):
+def random_horizontal_flip(
+    image, normalized_boxes=None, masks=None, seed=1, prob=0.5
+):
   """Randomly flips input image and bounding boxes horizontally."""
   with tf.name_scope('random_horizontal_flip'):
-    do_flip = tf.greater(tf.random.uniform([], seed=seed), 0.5)
+    do_flip = tf.less(tf.random.uniform([], seed=seed), prob)
     image = tf.cond(
         do_flip,
@@ -713,10 +725,12 @@ def random_horizontal_flip_with_roi(
     return image, boxes, masks, roi_boxes
-def random_vertical_flip(image, normalized_boxes=None, masks=None, seed=1):
+def random_vertical_flip(
+    image, normalized_boxes=None, masks=None, seed=1, prob=0.5
+):
   """Randomly flips input image and bounding boxes vertically."""
   with tf.name_scope('random_vertical_flip'):
-    do_flip = tf.greater(tf.random.uniform([], seed=seed), 0.5)
+    do_flip = tf.less(tf.random.uniform([], seed=seed), prob)
     image = tf.cond(
         do_flip,

{tf_models_nightly-2.11.0.dev20230320.dist-info → tf_models_nightly-2.11.0.dev20230322.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: tf-models-nightly
-Version: 2.11.0.dev20230320
+Version: 2.11.0.dev20230322
 Summary: TensorFlow Official Models
 Home-page: https://github.com/tensorflow/models
 Author: Google Inc.

tf-models-nightly 2.11.0.dev20230320__py2.py3-none-any.whl → 2.11.0.dev20230322__py2.py3-none-any.whl

tf-models-nightly 2.11.0.dev20230320__py2.py3-none-any.whl → 2.11.0.dev20230322__py2.py3-none-any.whl