Skip to content

Commit d01b591

Browse files
committed
Add decode_yuy2 (YUYV/YUY2/YUYV422) support
This PR adds support of decode_yuy2 to allow convert yuy2 to rgb. This is useful for Video Capture in Linux (Video4Linux2) as the default format is YUYV. This PR fixes tensorflow#825 Signed-off-by: Yong Tang <yong.tang.github@outlook.com>
1 parent 5b80b1d commit d01b591

File tree

11 files changed

+130
-3
lines changed

11 files changed

+130
-3
lines changed

tensorflow_io/core/BUILD

+1
Original file line numberDiff line numberDiff line change
@@ -168,6 +168,7 @@ cc_library(
168168
"kernels/image_pnm_kernels.cc",
169169
"kernels/image_tiff_kernels.cc",
170170
"kernels/image_webp_kernels.cc",
171+
"kernels/image_yuy2_kernels.cc",
171172
"ops/image_ops.cc",
172173
],
173174
copts = tf_io_copts(),
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,79 @@
1+
/* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
2+
3+
Licensed under the Apache License, Version 2.0 (the "License");
4+
you may not use this file except in compliance with the License.
5+
You may obtain a copy of the License at
6+
7+
http://www.apache.org/licenses/LICENSE-2.0
8+
9+
Unless required by applicable law or agreed to in writing, software
10+
distributed under the License is distributed on an "AS IS" BASIS,
11+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
See the License for the specific language governing permissions and
13+
limitations under the License.
14+
==============================================================================*/
15+
16+
#include "tensorflow/core/framework/op_kernel.h"
17+
#include "tensorflow_io/core/kernels/io_stream.h"
18+
19+
#include "libyuv/convert_argb.h"
20+
#include "libyuv/convert_from_argb.h"
21+
22+
namespace tensorflow {
23+
namespace io {
24+
namespace {
25+
26+
class DecodeYUY2Op : public OpKernel {
27+
public:
28+
explicit DecodeYUY2Op(OpKernelConstruction* context) : OpKernel(context) {
29+
env_ = context->env();
30+
}
31+
32+
void Compute(OpKernelContext* context) override {
33+
const Tensor* input_tensor;
34+
OP_REQUIRES_OK(context, context->input("input", &input_tensor));
35+
36+
const Tensor* size_tensor;
37+
OP_REQUIRES_OK(context, context->input("size", &size_tensor));
38+
39+
const tstring& input = input_tensor->scalar<tstring>()();
40+
41+
int64 channels = 3;
42+
int64 height = size_tensor->flat<int32>()(0);
43+
int64 width = size_tensor->flat<int32>()(1);
44+
45+
Tensor* image_tensor = nullptr;
46+
OP_REQUIRES_OK(
47+
context, context->allocate_output(
48+
0, TensorShape({height, width, channels}), &image_tensor));
49+
50+
string buffer;
51+
buffer.resize(width * height * 4);
52+
uint8* argb = (uint8*)&buffer[0];
53+
uint8* yuy2 = (uint8*)&input[0];
54+
uint32 yuy2_stride = width * 2;
55+
uint32 argb_stride = width * 4;
56+
int status =
57+
libyuv::YUY2ToARGB(yuy2, yuy2_stride, argb, argb_stride, width, height);
58+
OP_REQUIRES(
59+
context, (status == 0),
60+
errors::InvalidArgument("unable to convert yuy2 to argb: ", status));
61+
62+
uint8* rgb = image_tensor->flat<uint8>().data();
63+
uint32 rgb_stride = width * 3;
64+
status =
65+
libyuv::ARGBToRAW(argb, argb_stride, rgb, rgb_stride, width, height);
66+
OP_REQUIRES(
67+
context, (status == 0),
68+
errors::InvalidArgument("unable to convert argb to rgb: ", status));
69+
}
70+
71+
private:
72+
mutex mu_;
73+
Env* env_ GUARDED_BY(mu_);
74+
};
75+
REGISTER_KERNEL_BUILDER(Name("IO>DecodeYUY2").Device(DEVICE_CPU), DecodeYUY2Op);
76+
77+
} // namespace
78+
} // namespace io
79+
} // namespace tensorflow

tensorflow_io/core/ops/image_ops.cc

+11
Original file line numberDiff line numberDiff line change
@@ -183,6 +183,17 @@ REGISTER_OP("IO>DecodeNV12")
183183
return Status::OK();
184184
});
185185

186+
REGISTER_OP("IO>DecodeYUY2")
187+
.Input("input: string")
188+
.Input("size: int32")
189+
.Output("image: uint8")
190+
.SetShapeFn([](shape_inference::InferenceContext* c) {
191+
shape_inference::ShapeHandle unused;
192+
TF_RETURN_IF_ERROR(c->WithRank(c->input(0), 0, &unused));
193+
c->set_output(0, c->MakeShape({c->UnknownDim(), c->UnknownDim(), 3}));
194+
return Status::OK();
195+
});
196+
186197
} // namespace
187198
} // namespace io
188199
} // namespace tensorflow

tensorflow_io/core/python/api/experimental/image.py

+1
Original file line numberDiff line numberDiff line change
@@ -24,4 +24,5 @@
2424
decode_pnm,
2525
decode_hdr,
2626
decode_nv12,
27+
decode_yuy2,
2728
)

tensorflow_io/core/python/experimental/image_ops.py

+17-1
Original file line numberDiff line numberDiff line change
@@ -137,7 +137,7 @@ def decode_pnm(contents, dtype=tf.uint8, name=None):
137137

138138
def decode_hdr(contents, name=None):
139139
"""
140-
Decode a HDR-encoded image to a uint8 tensor.
140+
Decode a HDR-encoded image to a tf.float tensor.
141141
142142
Args:
143143
contents: A `Tensor` of type `string`. 0-D. The HDR-encoded image.
@@ -163,3 +163,19 @@ def decode_nv12(contents, size, name=None):
163163
A `Tensor` of type `uint8` and shape of `[height, width, 3]` (RGB).
164164
"""
165165
return core_ops.io_decode_nv12(contents, size=size, name=name)
166+
167+
168+
def decode_yuy2(contents, size, name=None):
169+
"""
170+
Decode a YUY2-encoded image to a uint8 tensor.
171+
172+
Args:
173+
contents: A `Tensor` of type `string`. 0-D. The YUY2-encoded image.
174+
size: A 1-D int32 Tensor of 2 elements: height, width. The size
175+
for the images.
176+
name: A name for the operation (optional).
177+
178+
Returns:
179+
A `Tensor` of type `uint8` and shape of `[height, width, 3]` (RGB).
180+
"""
181+
return core_ops.io_decode_yuy2(contents, size=size, name=name)
File renamed without changes.
File renamed without changes.

tests/test_image/Jelly-Beans.yuy2

+1
Large diffs are not rendered by default.

tests/test_image/Jelly-Beans.yuy2.png

73.5 KB
Loading

tests/test_image_eager.py

+19-2
Original file line numberDiff line numberDiff line change
@@ -294,10 +294,10 @@ def test_decode_hdr():
294294
def test_decode_nv12():
295295
"""Test case for decode_nv12"""
296296
filename = os.path.join(
297-
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.yuv"
297+
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.nv12"
298298
)
299299
png_filename = os.path.join(
300-
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.png"
300+
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.nv12.png"
301301
)
302302
png = tf.image.decode_png(tf.io.read_file(png_filename))
303303

@@ -308,5 +308,22 @@ def test_decode_nv12():
308308
assert np.all(rgb == png)
309309

310310

311+
def test_decode_yuy2():
312+
"""Test case for decode_yuy2"""
313+
filename = os.path.join(
314+
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.yuy2"
315+
)
316+
png_filename = os.path.join(
317+
os.path.dirname(os.path.abspath(__file__)), "test_image", "Jelly-Beans.yuy2.png"
318+
)
319+
png = tf.image.decode_png(tf.io.read_file(png_filename))
320+
321+
contents = tf.io.read_file(filename)
322+
rgb = tfio.experimental.image.decode_yuy2(contents, size=[256, 256])
323+
assert rgb.dtype == tf.uint8
324+
assert rgb.shape == [256, 256, 3]
325+
assert np.all(rgb == png)
326+
327+
311328
if __name__ == "__main__":
312329
test.main()

third_party/libyuv.BUILD

+1
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@ cc_library(
1313
"source/scale_*.cc",
1414
]) + [
1515
"source/convert_argb.cc",
16+
"source/convert_from_argb.cc",
1617
"source/cpu_id.cc",
1718
"source/planar_functions.cc",
1819
],

0 commit comments

Comments
 (0)