forked from SciSharp/TensorFlow.NET
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtf.image.cs
More file actions
257 lines (199 loc) · 17 KB
/
tf.image.cs
File metadata and controls
257 lines (199 loc) · 17 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
/*****************************************************************************
Copyright 2018 The TensorFlow.NET Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
******************************************************************************/
using System.Collections.Generic;
using Tensorflow.IO;
using static Tensorflow.Binding;
namespace Tensorflow
{
public partial class tensorflow
{
/// <summary>
/// Holder for the image wrappers declared in <see cref="image_internal"/>; created eagerly with the
/// parameterless constructor. This is a public, non-readonly field, so callers are able to reassign it.
/// </summary>
public image_internal image = new image_internal();
public class image_internal
{
/// <summary>
/// Thin wrapper that delegates to <c>image_ops_impl.random_flip_up_down</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="seed">Seed forwarded as the second argument; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_flip_up_down(Tensor image, int seed = 0)
{
    return image_ops_impl.random_flip_up_down(image, seed);
}
/// <summary>
/// Thin wrapper that delegates to <c>image_ops_impl.random_flip_left_right</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="seed">Seed forwarded as the second argument; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_flip_left_right(Tensor image, int seed = 0)
{
    return image_ops_impl.random_flip_left_right(image, seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.flip_left_right</c>.
/// </summary>
/// <param name="image">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor flip_left_right(Tensor image)
{
    return image_ops_impl.flip_left_right(image);
}
/// <summary>
/// Delegates to <c>image_ops_impl.flip_up_down</c>.
/// </summary>
/// <param name="image">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor flip_up_down(Tensor image)
{
    return image_ops_impl.flip_up_down(image);
}
/// <summary>
/// Delegates to <c>image_ops_impl.rot90</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="k">Integer forwarded as the second argument; 1 when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor rot90(Tensor image, int k = 1, string name = null)
{
    return image_ops_impl.rot90(image, k, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.transpose</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor transpose(Tensor image, string name = null)
{
    return image_ops_impl.transpose(image, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.central_crop</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="central_fraction">Fraction forwarded as the second argument; it has no default.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor central_crop(Tensor image, float central_fraction)
{
    return image_ops_impl.central_crop(image, central_fraction);
}
/// <summary>
/// Delegates to <c>image_ops_impl.pad_to_bounding_box</c>, passing all arguments positionally.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="offset_height">Forwarded unchanged.</param>
/// <param name="offset_width">Forwarded unchanged.</param>
/// <param name="target_height">Forwarded unchanged.</param>
/// <param name="target_width">Forwarded unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor pad_to_bounding_box(Tensor image, int offset_height, int offset_width, int target_height, int target_width)
{
    return image_ops_impl.pad_to_bounding_box(
        image,
        offset_height,
        offset_width,
        target_height,
        target_width);
}
/// <summary>
/// Delegates to <c>image_ops_impl.crop_to_bounding_box</c>, passing all arguments positionally.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="offset_height">Forwarded unchanged.</param>
/// <param name="offset_width">Forwarded unchanged.</param>
/// <param name="target_height">Forwarded unchanged.</param>
/// <param name="target_width">Forwarded unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor crop_to_bounding_box(Tensor image, int offset_height, int offset_width, int target_height, int target_width)
{
    return image_ops_impl.crop_to_bounding_box(
        image,
        offset_height,
        offset_width,
        target_height,
        target_width);
}
/// <summary>
/// Delegates to <c>image_ops_impl.resize_image_with_crop_or_pad</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="target_height">Typed as <c>object</c> and forwarded unchanged; which runtime types are
/// accepted is decided by the implementation, which is not visible from this file.</param>
/// <param name="target_width">Typed as <c>object</c> and forwarded unchanged; see <paramref name="target_height"/>.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_image_with_crop_or_pad(Tensor image, object target_height, object target_width)
{
    return image_ops_impl.resize_image_with_crop_or_pad(image, target_height, target_width);
}
/// <summary>
/// Delegates to <c>image_ops_impl.resize_images</c>, passing all six arguments positionally.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="size">Tensor forwarded as the second argument.</param>
/// <param name="method">Resize method string; <c>ResizeMethod.BILINEAR</c> when omitted.</param>
/// <param name="preserve_aspect_ratio">Forwarded unchanged; false when omitted.</param>
/// <param name="antialias">Forwarded unchanged; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_images(Tensor images, Tensor size, string method = ResizeMethod.BILINEAR, bool preserve_aspect_ratio = false, bool antialias = false,
    string name = null)
{
    return image_ops_impl.resize_images(
        images,
        size,
        method,
        preserve_aspect_ratio,
        antialias,
        name);
}
/// <summary>
/// Wraps <c>size.dims</c> with <c>tf.constant</c> and delegates to <c>image_ops_impl.resize_images</c>
/// with the result as the size argument.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="size">Shape whose <c>dims</c> are turned into the size argument.</param>
/// <param name="method">Resize method string; <c>ResizeMethod.BILINEAR</c> when omitted.</param>
/// <param name="preserve_aspect_ratio">Forwarded unchanged; false when omitted.</param>
/// <param name="antialias">Forwarded unchanged; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_images_v2(Tensor images, TensorShape size, string method = ResizeMethod.BILINEAR, bool preserve_aspect_ratio = false, bool antialias = false,
    string name = null)
{
    // Build the size argument first; the remaining arguments are plain parameter reads.
    var size_as_constant = tf.constant(size.dims);
    return image_ops_impl.resize_images(images, size_as_constant, method, preserve_aspect_ratio, antialias, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.resize_images_with_pad</c>. None of the parameters has a default.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="target_height">Forwarded unchanged.</param>
/// <param name="target_width">Forwarded unchanged.</param>
/// <param name="method">Resize method string, forwarded unchanged.</param>
/// <param name="antialias">Forwarded unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_images_with_pad(Tensor image, int target_height, int target_width, string method, bool antialias)
{
    return image_ops_impl.resize_images_with_pad(
        image,
        target_height,
        target_width,
        method,
        antialias);
}
/// <summary>
/// Delegates to <c>image_ops_impl.per_image_standardization</c>.
/// </summary>
/// <param name="image">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor per_image_standardization(Tensor image)
{
    return image_ops_impl.per_image_standardization(image);
}
/// <summary>
/// Delegates to <c>image_ops_impl.random_brightness</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="max_delta">Forwarded unchanged; it has no default.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_brightness(Tensor image, float max_delta, int seed = 0)
{
    return image_ops_impl.random_brightness(image, max_delta, seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.random_contrast</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="lower">Forwarded unchanged.</param>
/// <param name="upper">Forwarded unchanged.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_contrast(Tensor image, float lower, float upper, int seed = 0)
{
    return image_ops_impl.random_contrast(image, lower, upper, seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_brightness</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="delta">Tensor forwarded as the second argument.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_brightness(Tensor image, Tensor delta)
{
    return image_ops_impl.adjust_brightness(image, delta);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_contrast</c>.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="contrast_factor">Tensor forwarded as the second argument.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_contrast(Tensor images, Tensor contrast_factor)
{
    return image_ops_impl.adjust_contrast(images, contrast_factor);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_gamma</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="gamma">Integer forwarded unchanged; 1 when omitted.</param>
/// <param name="gain">Integer forwarded unchanged; 1 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_gamma(Tensor image, int gamma = 1, int gain = 1)
{
    // NOTE(review): both factors are declared as int, so fractional values cannot be expressed
    // through this wrapper - confirm against image_ops_impl whether that is intended.
    return image_ops_impl.adjust_gamma(image, gamma, gain);
}
/// <summary>
/// Delegates to <c>image_ops_impl.rgb_to_grayscale</c>.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor rgb_to_grayscale(Tensor images, string name = null)
{
    return image_ops_impl.rgb_to_grayscale(images, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.grayscale_to_rgb</c>.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor grayscale_to_rgb(Tensor images, string name = null)
{
    return image_ops_impl.grayscale_to_rgb(images, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.random_hue</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="max_delta">Forwarded unchanged; it has no default.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_hue(Tensor image, float max_delta, int seed = 0)
{
    return image_ops_impl.random_hue(image, max_delta, seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_hue</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="delta">Tensor forwarded as the second argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_hue(Tensor image, Tensor delta, string name = null)
{
    return image_ops_impl.adjust_hue(image, delta, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.random_jpeg_quality</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="min_jpeg_quality">Forwarded unchanged.</param>
/// <param name="max_jpeg_quality">Forwarded unchanged.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_jpeg_quality(Tensor image, float min_jpeg_quality, float max_jpeg_quality, int seed = 0)
{
    return image_ops_impl.random_jpeg_quality(
        image,
        min_jpeg_quality,
        max_jpeg_quality,
        seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_jpeg_quality</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="jpeg_quality">Tensor forwarded as the second argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_jpeg_quality(Tensor image, Tensor jpeg_quality, string name = null)
{
    return image_ops_impl.adjust_jpeg_quality(image, jpeg_quality, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.random_saturation</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="lower">Forwarded unchanged.</param>
/// <param name="upper">Forwarded unchanged.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor random_saturation(Tensor image, float lower, float upper, int seed = 0)
{
    return image_ops_impl.random_saturation(image, lower, upper, seed);
}
/// <summary>
/// Delegates to <c>image_ops_impl.adjust_saturation</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="saturation_factor">Tensor forwarded as the second argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor adjust_saturation(Tensor image, Tensor saturation_factor, string name = null)
{
    return image_ops_impl.adjust_saturation(image, saturation_factor, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.total_variation</c>.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor total_variation(Tensor images, string name = null)
{
    return image_ops_impl.total_variation(images, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.sample_distorted_bounding_box_v2</c> (note the <c>_v2</c> suffix on the
/// implementation), passing every argument positionally in declaration order.
/// </summary>
/// <param name="image_size">Tensor forwarded as the first argument.</param>
/// <param name="bounding_boxes">Tensor forwarded as the second argument.</param>
/// <param name="seed">Seed forwarded unchanged; 0 when omitted.</param>
/// <param name="min_object_covered">Forwarded unchanged; null when omitted.</param>
/// <param name="aspect_ratio_range">Forwarded unchanged; null when omitted.</param>
/// <param name="area_range">Forwarded unchanged; null when omitted.</param>
/// <param name="max_attempts">Forwarded unchanged; 100 when omitted.</param>
/// <param name="use_image_if_no_bounding_boxes">Forwarded unchanged; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The three-tensor tuple produced by the implementation.</returns>
public (Tensor, Tensor, Tensor) sample_distorted_bounding_box(Tensor image_size, Tensor bounding_boxes,
    int seed = 0,
    Tensor min_object_covered = null,
    float[] aspect_ratio_range = null,
    float[] area_range = null,
    int max_attempts = 100,
    bool use_image_if_no_bounding_boxes = false,
    string name = null)
{
    return image_ops_impl.sample_distorted_bounding_box_v2(
        image_size,
        bounding_boxes,
        seed,
        min_object_covered,
        aspect_ratio_range,
        area_range,
        max_attempts,
        use_image_if_no_bounding_boxes,
        name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.non_max_suppression</c>.
/// </summary>
/// <remarks>
/// The default of <paramref name="score_threshold"/> is written as <c>float.NegativeInfinity</c>; this is
/// the same value the former constant expression <c>-1f / 0f</c> evaluated to. A <c>soft_nms_sigma</c>
/// parameter is not exposed by this wrapper.
/// </remarks>
/// <param name="boxes">Tensor forwarded as the first argument.</param>
/// <param name="scores">Tensor forwarded as the second argument.</param>
/// <param name="max_output_size">Tensor forwarded as the third argument.</param>
/// <param name="iou_threshold">Forwarded unchanged; 0.5 when omitted.</param>
/// <param name="score_threshold">Forwarded unchanged; negative infinity when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor non_max_suppression(Tensor boxes, Tensor scores, Tensor max_output_size, float iou_threshold = 0.5f,
    float score_threshold = float.NegativeInfinity, string name = null)
    => image_ops_impl.non_max_suppression(boxes, scores, max_output_size, iou_threshold, score_threshold, name);
/// <summary>
/// Delegates to <c>image_ops_impl.non_max_suppression_with_overlaps</c>.
/// </summary>
/// <remarks>
/// The default of <paramref name="score_threshold"/> is written as <c>float.NegativeInfinity</c>; this is
/// the same value the former mixed int/float constant expression <c>-1 / 0f</c> evaluated to.
/// </remarks>
/// <param name="overlaps">Tensor forwarded as the first argument.</param>
/// <param name="scores">Tensor forwarded as the second argument.</param>
/// <param name="max_output_size">Tensor forwarded as the third argument.</param>
/// <param name="overlap_threshold">Forwarded unchanged; 0.5 when omitted.</param>
/// <param name="score_threshold">Forwarded unchanged; negative infinity when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor non_max_suppression_with_overlaps(Tensor overlaps, Tensor scores, Tensor max_output_size,
    float overlap_threshold = 0.5f, float score_threshold = float.NegativeInfinity, string name = null)
    => image_ops_impl.non_max_suppression_with_overlaps(overlaps, scores, max_output_size, overlap_threshold, score_threshold, name);
/// <summary>
/// Delegates to <c>image_ops_impl.rgb_to_yiq</c>.
/// </summary>
/// <param name="images">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor rgb_to_yiq(Tensor images)
{
    return image_ops_impl.rgb_to_yiq(images);
}
/// <summary>
/// Delegates to <c>image_ops_impl.yiq_to_rgb</c>.
/// </summary>
/// <param name="images">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor yiq_to_rgb(Tensor images)
{
    return image_ops_impl.yiq_to_rgb(images);
}
/// <summary>
/// Delegates to <c>image_ops_impl.rgb_to_yuv</c>.
/// </summary>
/// <param name="images">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor rgb_to_yuv(Tensor images)
{
    return image_ops_impl.rgb_to_yuv(images);
}
/// <summary>
/// Delegates to <c>image_ops_impl.yuv_to_rgb</c>.
/// </summary>
/// <param name="images">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor yuv_to_rgb(Tensor images)
{
    return image_ops_impl.yuv_to_rgb(images);
}
/// <summary>
/// Delegates to <c>image_ops_impl.psnr</c>.
/// </summary>
/// <param name="a">Tensor forwarded as the first argument.</param>
/// <param name="b">Tensor forwarded as the second argument.</param>
/// <param name="max_val">Tensor forwarded as the third argument.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor psnr(Tensor a, Tensor b, Tensor max_val, string name = null)
{
    return image_ops_impl.psnr(a, b, max_val, name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.ssim</c>, passing every argument positionally.
/// </summary>
/// <param name="img1">Tensor forwarded as the first argument.</param>
/// <param name="img2">Tensor forwarded as the second argument.</param>
/// <param name="max_val">Forwarded unchanged; 1 when omitted.</param>
/// <param name="filter_size">Forwarded unchanged; 11 when omitted. Declared as <c>float</c> here.</param>
/// <param name="filter_sigma">Forwarded unchanged; 1.5 when omitted.</param>
/// <param name="k1">Forwarded unchanged; 0.01 when omitted.</param>
/// <param name="k2">Forwarded unchanged; 0.03 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor ssim(Tensor img1, Tensor img2, float max_val = 1f, float filter_size = 11f, float filter_sigma = 1.5f,
    float k1 = 0.01f, float k2 = 0.03f)
{
    return image_ops_impl.ssim(
        img1,
        img2,
        max_val,
        filter_size,
        filter_sigma,
        k1,
        k2);
}
/// <summary>
/// Delegates to <c>image_ops_impl.ssim_multiscale</c>, passing every argument positionally.
/// </summary>
/// <param name="img1">Tensor forwarded as the first argument.</param>
/// <param name="img2">Tensor forwarded as the second argument.</param>
/// <param name="max_val">Forwarded unchanged; unlike in <c>ssim</c> it has no default here.</param>
/// <param name="power_factors">Forwarded unchanged; null when omitted.</param>
/// <param name="filter_size">Forwarded unchanged; 11 when omitted. Declared as <c>float</c> here.</param>
/// <param name="filter_sigma">Forwarded unchanged; 1.5 when omitted.</param>
/// <param name="k1">Forwarded unchanged; 0.01 when omitted.</param>
/// <param name="k2">Forwarded unchanged; 0.03 when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor ssim_multiscale(Tensor img1, Tensor img2, float max_val, float[] power_factors = null, float filter_size = 11f,
    float filter_sigma = 1.5f, float k1 = 0.01f, float k2 = 0.03f)
{
    return image_ops_impl.ssim_multiscale(
        img1,
        img2,
        max_val,
        power_factors,
        filter_size,
        filter_sigma,
        k1,
        k2);
}
/// <summary>
/// Delegates to <c>image_ops_impl.image_gradients</c>.
/// </summary>
/// <param name="image">Tensor handed to the implementation unchanged.</param>
/// <returns>The two-tensor tuple produced by the implementation.</returns>
public (Tensor, Tensor) image_gradients(Tensor image)
{
    return image_ops_impl.image_gradients(image);
}
/// <summary>
/// Delegates to <c>image_ops_impl.sobel_edges</c>.
/// </summary>
/// <param name="image">Tensor handed to the implementation unchanged.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor sobel_edges(Tensor image)
{
    return image_ops_impl.sobel_edges(image);
}
/// <summary>
/// Delegates to <c>gen_image_ops.decode_jpeg</c>, passing every option as a named argument.
/// </summary>
/// <remarks>
/// <paramref name="name"/> used to be accepted but silently dropped; it is now forwarded like the other
/// options. This assumes <c>gen_image_ops.decode_jpeg</c> exposes a <c>name</c> parameter, as the other
/// <c>gen_image_ops</c> calls in this class (<c>resize_bilinear</c>, <c>convert_image_dtype</c>) do.
/// </remarks>
/// <param name="contents">Tensor forwarded as the first (positional) argument.</param>
/// <param name="channels">Forwarded as <c>channels</c>; 0 when omitted.</param>
/// <param name="ratio">Forwarded as <c>ratio</c>; 1 when omitted.</param>
/// <param name="fancy_upscaling">Forwarded as <c>fancy_upscaling</c>; true when omitted.</param>
/// <param name="try_recover_truncated">Forwarded as <c>try_recover_truncated</c>; false when omitted.</param>
/// <param name="acceptable_fraction">Forwarded as <c>acceptable_fraction</c>; 1 when omitted.</param>
/// <param name="dct_method">Forwarded as <c>dct_method</c>; empty string when omitted.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <returns>The tensor produced by the generated op wrapper.</returns>
public Tensor decode_jpeg(Tensor contents,
    int channels = 0,
    int ratio = 1,
    bool fancy_upscaling = true,
    bool try_recover_truncated = false,
    // NOTE(review): declared as int, so only whole numbers can be passed; TensorFlow documents this
    // option as a float - confirm against gen_image_ops before widening the type.
    int acceptable_fraction = 1,
    string dct_method = "",
    string name = null)
    => gen_image_ops.decode_jpeg(contents,
        channels: channels,
        ratio: ratio,
        fancy_upscaling: fancy_upscaling,
        try_recover_truncated: try_recover_truncated,
        acceptable_fraction: acceptable_fraction,
        dct_method: dct_method,
        name: name);
/// <summary>
/// Extracts crops from the input image tensor and resizes them, using bilinear or nearest-neighbor
/// sampling (possibly with a change of aspect ratio), to a common output size specified by
/// <paramref name="crop_size"/>. This is more general than the crop_to_bounding_box op, which extracts a
/// fixed-size slice from the input image and does not allow resizing or a change of aspect ratio.
/// <para>
/// Returns a tensor with crops from the input image at the positions defined by the bounding box
/// locations in <paramref name="boxes"/>. The cropped boxes are all resized (with bilinear or
/// nearest-neighbor interpolation) to a fixed size = [crop_height, crop_width]. The result is a 4-D
/// tensor [num_boxes, crop_height, crop_width, depth]. The resizing is corner aligned. In particular, if
/// boxes = [[0, 0, 1, 1]], the method gives results identical to tf.image.resize_bilinear() or
/// tf.image.resize_nearest_neighbor() (depending on the method argument) with align_corners = True.
/// </para>
/// </summary>
/// <param name="image">A Tensor. Must be one of the following types: uint8, uint16, int8, int16, int32,
/// int64, half, float32, float64. A 4-D tensor of shape [batch, image_height, image_width, depth]. Both
/// image_height and image_width need to be positive.</param>
/// <param name="boxes">A Tensor of type float32. A 2-D tensor of shape [num_boxes, 4]. The i-th row of
/// the tensor specifies the coordinates of a box in the box_ind[i] image and is given in normalized
/// coordinates [y1, x1, y2, x2]. A normalized coordinate value of y is mapped to the image coordinate at
/// y * (image_height - 1), so the [0, 1] interval of normalized image height is mapped to
/// [0, image_height - 1] in image height coordinates. y1 &gt; y2 is allowed, in which case the sampled crop
/// is an up-down flipped version of the original image. The width dimension is treated similarly.
/// Normalized coordinates outside the [0, 1] range are allowed, in which case extrapolation_value is used
/// to extrapolate the input image values.</param>
/// <param name="box_ind">A Tensor of type int32. A 1-D tensor of shape [num_boxes] with int32 values in
/// [0, batch). The value of box_ind[i] specifies the image that the i-th box refers to.</param>
/// <param name="crop_size">A Tensor of type int32. A 1-D tensor of 2 elements,
/// size = [crop_height, crop_width]. All cropped image patches are resized to this size. The aspect ratio
/// of the image content is not preserved. Both crop_height and crop_width need to be positive.</param>
/// <param name="method">An optional string, either "bilinear" or "nearest"; defaults to "bilinear".
/// Specifies the sampling method used for resizing. Currently two sampling methods are supported:
/// Bilinear and Nearest Neighbor.</param>
/// <param name="extrapolation_value">An optional float. Defaults to 0. Value used for extrapolation, when
/// applicable.</param>
/// <param name="name">A name for the operation (optional).</param>
/// <returns>A 4-D tensor of shape [num_boxes, crop_height, crop_width, depth].</returns>
public Tensor crop_and_resize(Tensor image, Tensor boxes, Tensor box_ind, Tensor crop_size, string method = "bilinear", float extrapolation_value = 0f, string name = null)
{
    // All arguments go to image_ops_impl.crop_and_resize positionally, in declaration order.
    return image_ops_impl.crop_and_resize(
        image,
        boxes,
        box_ind,
        crop_size,
        method,
        extrapolation_value,
        name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.extract_glimpse</c>, passing every argument positionally.
/// </summary>
/// <param name="input">Tensor forwarded as the first argument.</param>
/// <param name="size">Tensor forwarded as the second argument.</param>
/// <param name="offsets">Tensor forwarded as the third argument.</param>
/// <param name="centered">Forwarded unchanged; true when omitted.</param>
/// <param name="normalized">Forwarded unchanged; true when omitted.</param>
/// <param name="uniform_noise">Forwarded unchanged; true when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor extract_glimpse(Tensor input, Tensor size, Tensor offsets, bool centered = true, bool normalized = true,
    bool uniform_noise = true, string name = null)
{
    return image_ops_impl.extract_glimpse(
        input,
        size,
        offsets,
        centered,
        normalized,
        uniform_noise,
        name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.combined_non_max_suppression</c>, passing every argument positionally.
/// </summary>
/// <remarks>
/// The default of <paramref name="score_threshold"/> is written as <c>float.NegativeInfinity</c>; this is
/// the same value the former constant expression <c>-1f / 0f</c> evaluated to.
/// </remarks>
/// <param name="boxes">Tensor forwarded as the first argument.</param>
/// <param name="scores">Tensor forwarded as the second argument.</param>
/// <param name="max_output_size_per_class">Tensor forwarded as the third argument.</param>
/// <param name="max_total_size">Tensor forwarded as the fourth argument.</param>
/// <param name="iou_threshold">Forwarded unchanged; 0.5 when omitted.</param>
/// <param name="score_threshold">Forwarded unchanged; negative infinity when omitted.</param>
/// <param name="pad_per_class">Forwarded unchanged; false when omitted.</param>
/// <param name="clip_boxes">Forwarded unchanged; true when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The four-tensor tuple produced by the implementation.</returns>
public (Tensor, Tensor, Tensor, Tensor) combined_non_max_suppression(Tensor boxes, Tensor scores, Tensor max_output_size_per_class,
    Tensor max_total_size, float iou_threshold = 0.5f, float score_threshold = float.NegativeInfinity, bool pad_per_class = false, bool clip_boxes = true,
    string name = null)
    => image_ops_impl.combined_non_max_suppression(boxes, scores, max_output_size_per_class, max_total_size, iou_threshold, score_threshold,
        pad_per_class, clip_boxes, name);
/// <summary>
/// Delegates to <c>image_ops_impl.non_max_suppression_padded</c>, passing every argument positionally.
/// </summary>
/// <remarks>
/// The default of <paramref name="score_threshold"/> is written as <c>float.NegativeInfinity</c>; this is
/// the same value the former constant expression <c>-1f / 0f</c> evaluated to.
/// </remarks>
/// <param name="boxes">Tensor forwarded as the first argument.</param>
/// <param name="scores">Tensor forwarded as the second argument.</param>
/// <param name="max_output_size">Tensor forwarded as the third argument.</param>
/// <param name="iou_threshold">Forwarded unchanged; 0.5 when omitted.</param>
/// <param name="score_threshold">Forwarded unchanged; negative infinity when omitted.</param>
/// <param name="pad_to_max_output_size">Forwarded unchanged; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <param name="sorted_input">Forwarded unchanged; false when omitted.</param>
/// <param name="canonicalized_coordinates">Forwarded unchanged; false when omitted.</param>
/// <param name="tile_size">Forwarded unchanged; 512 when omitted.</param>
/// <returns>The two-tensor tuple produced by the implementation.</returns>
public (Tensor, Tensor) non_max_suppression_padded(Tensor boxes, Tensor scores, Tensor max_output_size,
    float iou_threshold = 0.5f,
    float score_threshold = float.NegativeInfinity,
    bool pad_to_max_output_size = false,
    string name = null,
    bool sorted_input = false,
    bool canonicalized_coordinates = false,
    int tile_size = 512)
    => image_ops_impl.non_max_suppression_padded(boxes, scores, max_output_size, iou_threshold, score_threshold, pad_to_max_output_size,
        name, sorted_input, canonicalized_coordinates, tile_size);
/// <summary>
/// Delegates to <c>image_ops_impl.resize_images_v2</c>, supplying only the image, the size and the
/// method; any other option of the implementation keeps its own default.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="size">Shape forwarded as the second argument.</param>
/// <param name="method">Resize method string passed by name; <c>ResizeMethod.BILINEAR</c> when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize(Tensor image, TensorShape size, string method = ResizeMethod.BILINEAR)
{
    return image_ops_impl.resize_images_v2(image, size, method: method);
}
/// <summary>
/// Delegates to <c>gen_image_ops.resize_bilinear</c>; the options are passed as named arguments.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="size">Tensor forwarded as the second argument.</param>
/// <param name="align_corners">Forwarded as <c>align_corners</c>; false when omitted.</param>
/// <param name="half_pixel_centers">Forwarded as <c>half_pixel_centers</c>; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <returns>The tensor produced by the generated op wrapper.</returns>
public Tensor resize_bilinear(Tensor images, Tensor size, bool align_corners = false, bool half_pixel_centers = false, string name = null)
{
    return gen_image_ops.resize_bilinear(
        images,
        size,
        align_corners: align_corners,
        half_pixel_centers: half_pixel_centers,
        name: name);
}
/// <summary>
/// Overload of <c>resize_images</c> without an <c>antialias</c> argument. Delegates to
/// <c>image_ops_impl.resize_images</c>, passing the options as named arguments.
/// </summary>
/// <remarks>
/// The trailing parameters deliberately carry no default values. The sibling overload that additionally
/// takes <c>antialias</c> declares defaults for the same leading parameters; while both overloads had
/// defaults, a call that omitted optional arguments (for example <c>resize_images(images, size)</c>) matched
/// both equally well and was rejected by the compiler as ambiguous (CS0121). Calls that supply all five
/// arguments bind to this overload exactly as before; shorter calls now bind to the sibling overload.
/// </remarks>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="size">Tensor forwarded as the second argument.</param>
/// <param name="method">Resize method string, forwarded as <c>method</c>.</param>
/// <param name="preserve_aspect_ratio">Forwarded as <c>preserve_aspect_ratio</c>.</param>
/// <param name="name">Operation name, forwarded as <c>name</c>; may be null.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_images(Tensor images, Tensor size, string method,
    bool preserve_aspect_ratio, string name)
    => image_ops_impl.resize_images(images, size, method: method,
        preserve_aspect_ratio: preserve_aspect_ratio, name: name);
/// <summary>
/// Delegates to <c>gen_image_ops.convert_image_dtype</c>.
/// </summary>
/// <param name="image">Tensor forwarded as the first argument.</param>
/// <param name="dtype">Data type forwarded as the second argument.</param>
/// <param name="saturate">Forwarded as <c>saturate</c>; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <returns>The tensor produced by the generated op wrapper.</returns>
public Tensor convert_image_dtype(Tensor image, TF_DataType dtype, bool saturate = false, string name = null)
{
    return gen_image_ops.convert_image_dtype(
        image,
        dtype,
        saturate: saturate,
        name: name);
}
/// <summary>
/// Delegates to <c>image_ops_impl.decode_image</c>; the options are passed as named arguments.
/// </summary>
/// <param name="contents">Tensor forwarded as the first argument.</param>
/// <param name="channels">Forwarded as <c>channels</c>; 0 when omitted.</param>
/// <param name="dtype">Forwarded as <c>dtype</c>; <c>TF_DataType.TF_UINT8</c> when omitted.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <param name="expand_animations">Forwarded as <c>expand_animations</c>; true when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor decode_image(Tensor contents, int channels = 0, TF_DataType dtype = TF_DataType.TF_UINT8,
    string name = null, bool expand_animations = true)
{
    return image_ops_impl.decode_image(
        contents,
        channels: channels,
        dtype: dtype,
        name: name,
        expand_animations: expand_animations);
}
/// <summary>
/// Convenience function to check whether <paramref name="contents"/> encodes a JPEG image.
/// Delegates to <c>image_ops_impl.is_jpeg</c>.
/// </summary>
/// <param name="contents">Tensor forwarded as the first argument.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor is_jpeg(Tensor contents, string name = null)
{
    return image_ops_impl.is_jpeg(contents, name: name);
}
/// <summary>
/// Resize <paramref name="images"/> to <paramref name="size"/> using nearest neighbor interpolation.
/// Delegates to <c>image_ops_impl.resize_nearest_neighbor</c>.
/// </summary>
/// <typeparam name="Tsize">Type of the size argument; it is unconstrained here and handed on as-is.</typeparam>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="size">Size value forwarded as the second argument.</param>
/// <param name="align_corners">Forwarded as <c>align_corners</c>; false when omitted.</param>
/// <param name="name">Optional operation name, forwarded as <c>name</c> (null when omitted).</param>
/// <param name="half_pixel_centers">Forwarded as <c>half_pixel_centers</c>; false when omitted.</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor resize_nearest_neighbor<Tsize>(Tensor images, Tsize size, bool align_corners = false,
    string name = null, bool half_pixel_centers = false)
{
    return image_ops_impl.resize_nearest_neighbor(
        images,
        size,
        align_corners: align_corners,
        name: name,
        half_pixel_centers: half_pixel_centers);
}
/// <summary>
/// Delegates to <c>image_ops_impl.draw_bounding_boxes</c>.
/// </summary>
/// <param name="images">Tensor forwarded as the first argument.</param>
/// <param name="boxes">Tensor forwarded as the second argument.</param>
/// <param name="colors">Tensor forwarded as the third argument; null when omitted.</param>
/// <param name="name">Optional operation name, forwarded as-is (null when omitted).</param>
/// <returns>The tensor produced by the implementation.</returns>
public Tensor draw_bounding_boxes(Tensor images, Tensor boxes, Tensor colors = null, string name = null)
{
    return image_ops_impl.draw_bounding_boxes(images, boxes, colors, name);
}
}
}
}