Spaces:
Sleeping
Sleeping
# Copyright 2018 The TensorFlow Authors. All Rights Reserved. | |
# | |
# Licensed under the Apache License, Version 2.0 (the "License"); | |
# you may not use this file except in compliance with the License. | |
# You may obtain a copy of the License at | |
# | |
# http://www.apache.org/licenses/LICENSE-2.0 | |
# | |
# Unless required by applicable law or agreed to in writing, software | |
# distributed under the License is distributed on an "AS IS" BASIS, | |
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
# See the License for the specific language governing permissions and | |
# limitations under the License. | |
# ============================================================================== | |
"""Image summaries and TensorFlow operations to create them, V2 versions. | |
An image summary stores the width, height, and PNG-encoded data for zero | |
or more images in a rank-1 string array: `[w, h, png0, png1, ...]`. | |
""" | |
from tensorboard.compat import tf2 as tf | |
from tensorboard.plugins.image import metadata | |
from tensorboard.util import lazy_tensor_creator | |
def image(name, data, step=None, max_outputs=3, description=None): | |
"""Write an image summary. | |
See also `tf.summary.scalar`, `tf.summary.SummaryWriter`. | |
Writes a collection of images to the current default summary writer. Data | |
appears in TensorBoard's 'Images' dashboard. Like `tf.summary.scalar` points, | |
each collection of images is associated with a `step` and a `name`. All the | |
image collections with the same `name` constitute a time series of image | |
collections. | |
This example writes 2 random grayscale images: | |
```python | |
w = tf.summary.create_file_writer('test/logs') | |
with w.as_default(): | |
image1 = tf.random.uniform(shape=[8, 8, 1]) | |
image2 = tf.random.uniform(shape=[8, 8, 1]) | |
tf.summary.image("grayscale_noise", [image1, image2], step=0) | |
``` | |
To avoid clipping, data should be converted to one of the following: | |
- floating point values in the range [0,1], or | |
- uint8 values in the range [0,255] | |
```python | |
# Convert the original dtype=int32 `Tensor` into `dtype=float64`. | |
rgb_image_float = tf.constant([ | |
[[1000, 0, 0], [0, 500, 1000]], | |
]) / 1000 | |
tf.summary.image("picture", [rgb_image_float], step=0) | |
# Convert original dtype=uint8 `Tensor` into proper range. | |
rgb_image_uint8 = tf.constant([ | |
[[1, 1, 0], [0, 0, 1]], | |
], dtype=tf.uint8) * 255 | |
tf.summary.image("picture", [rgb_image_uint8], step=1) | |
``` | |
Arguments: | |
name: A name for this summary. The summary tag used for TensorBoard will | |
be this name prefixed by any active name scopes. | |
data: A `Tensor` representing pixel data with shape `[k, h, w, c]`, | |
where `k` is the number of images, `h` and `w` are the height and | |
width of the images, and `c` is the number of channels, which | |
should be 1, 2, 3, or 4 (grayscale, grayscale with alpha, RGB, RGBA). | |
Any of the dimensions may be statically unknown (i.e., `None`). | |
Floating point data will be clipped to the range [0,1]. Other data types | |
will be clipped into an allowed range for safe casting to uint8, using | |
`tf.image.convert_image_dtype`. | |
step: Explicit `int64`-castable monotonic step value for this summary. If | |
omitted, this defaults to `tf.summary.experimental.get_step()`, which must | |
not be None. | |
max_outputs: Optional `int` or rank-0 integer `Tensor`. At most this | |
many images will be emitted at each step. When more than | |
`max_outputs` many images are provided, the first `max_outputs` many | |
images will be used and the rest silently discarded. | |
description: Optional long-form description for this summary, as a | |
constant `str`. Markdown is supported. Defaults to empty. | |
Returns: | |
True on success, or false if no summary was emitted because no default | |
summary writer was available. | |
Raises: | |
ValueError: if a default writer exists, but no step was provided and | |
`tf.summary.experimental.get_step()` is None. | |
""" | |
summary_metadata = metadata.create_summary_metadata( | |
display_name=None, description=description | |
) | |
# TODO(https://github.com/tensorflow/tensorboard/issues/2109): remove fallback | |
summary_scope = ( | |
getattr(tf.summary.experimental, "summary_scope", None) | |
or tf.summary.summary_scope | |
) | |
with summary_scope( | |
name, "image_summary", values=[data, max_outputs, step] | |
) as (tag, _): | |
# Defer image encoding preprocessing by passing it as a callable to write(), | |
# wrapped in a LazyTensorCreator for backwards compatibility, so that we | |
# only do this work when summaries are actually written. | |
def lazy_tensor(): | |
tf.debugging.assert_rank(data, 4) | |
tf.debugging.assert_non_negative(max_outputs) | |
images = tf.image.convert_image_dtype(data, tf.uint8, saturate=True) | |
limited_images = images[:max_outputs] | |
encoded_images = tf.image.encode_png(limited_images) | |
image_shape = tf.shape(input=images) | |
dimensions = tf.stack( | |
[ | |
tf.as_string(image_shape[2], name="width"), | |
tf.as_string(image_shape[1], name="height"), | |
], | |
name="dimensions", | |
) | |
return tf.concat([dimensions, encoded_images], axis=0) | |
# To ensure that image encoding logic is only executed when summaries | |
# are written, we pass callable to `tensor` parameter. | |
return tf.summary.write( | |
tag=tag, tensor=lazy_tensor, step=step, metadata=summary_metadata | |
) | |