-
Notifications
You must be signed in to change notification settings - Fork 7k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Reviewed By: vmoens Differential Revision: D57099453 fbshipit-source-id: 0e85ec0c92cc4e2ee06b5d4183fedc639f38dec0
- Loading branch information
1 parent
564eec7
commit 183aba1
Showing
22 changed files
with
2,644 additions
and
24 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -19,6 +19,7 @@ Images | |
encode_jpeg | ||
decode_jpeg | ||
write_jpeg | ||
decode_gif | ||
encode_png | ||
decode_png | ||
write_png | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,157 @@ | ||
#include "decode_gif.h" | ||
#include <cstring> | ||
#include "giflib/gif_lib.h" | ||
|
||
namespace vision { | ||
namespace image { | ||
|
||
// Read cursor over the encoded input bytes. A pointer to an instance is handed
// to GIFLIB as user data so that the read callback knows where to resume.
struct reader_helper_t {
  // Pointer to the first byte of the input tensor's data.
  const uint8_t* encoded_data;
  // Total size of the input tensor, in bytes.
  size_t encoded_data_size;
  // How many bytes of the input tensor have been consumed so far.
  size_t num_bytes_read;
};
|
||
// Read callback used by GIFLIB routines to fetch the encoded bytes.
//
// Copies up to `len` bytes into `buf`. The data is read from the input tensor
// passed to decode_gif(), starting at the `num_bytes_read` position, and that
// position is then advanced by the number of bytes actually copied.
//
// Returns the number of bytes copied. This is smaller than `len` (possibly 0)
// when fewer than `len` bytes remain in the input, or when `len` is not
// positive.
int read_from_tensor(GifFileType* gifFile, GifByteType* buf, int len) {
  // the UserData field was set in DGifOpen()
  reader_helper_t* reader_helper =
      static_cast<reader_helper_t*>(gifFile->UserData);

  // A non-positive request must not be turned into a huge size_t below.
  if (len <= 0) {
    return 0;
  }

  const size_t num_bytes_remaining =
      reader_helper->encoded_data_size - reader_helper->num_bytes_read;
  const size_t num_bytes_to_read =
      std::min(static_cast<size_t>(len), num_bytes_remaining);
  if (num_bytes_to_read == 0) {
    // Input exhausted (or empty): nothing to copy.
    return 0;
  }

  // Copy only the bytes that are actually available. Copying `len` bytes
  // here would read past the end of the tensor on truncated input.
  std::memcpy(
      buf,
      reader_helper->encoded_data + reader_helper->num_bytes_read,
      num_bytes_to_read);
  reader_helper->num_bytes_read += num_bytes_to_read;
  // num_bytes_to_read <= len, so the value always fits in an int.
  return static_cast<int>(num_bytes_to_read);
}
|
||
torch::Tensor decode_gif(const torch::Tensor& encoded_data) { | ||
// LibGif docs: https://giflib.sourceforge.net/intro.html | ||
// Refer over there for more details on the libgif API, API ref, and a | ||
// detailed description of the GIF format. | ||
|
||
TORCH_CHECK(encoded_data.is_contiguous(), "Input tensor must be contiguous."); | ||
TORCH_CHECK( | ||
encoded_data.dtype() == torch::kU8, | ||
"Input tensor must have uint8 data type, got ", | ||
encoded_data.dtype()); | ||
TORCH_CHECK( | ||
encoded_data.dim() == 1, | ||
"Input tensor must be 1-dimensional, got ", | ||
encoded_data.dim(), | ||
" dims."); | ||
|
||
int error = D_GIF_SUCCEEDED; | ||
|
||
// We're using DGidOpen. The other entrypoints of libgif are | ||
// DGifOpenFileName and DGifOpenFileHandle but we don't want to use those, | ||
// since we need to read the encoded bytes from a tensor of encoded bytes, not | ||
// from a file (for consistency with existing jpeg and png decoders). Using | ||
// DGifOpen is the only way to read from a custom source. | ||
// For that we need to provide a reader function `read_from_tensor` that | ||
// reads from the tensor, and we have to keep track of the number of bytes | ||
// read so far: this is why we need the reader_helper struct. | ||
|
||
// TODO: We are potentially doing an unnecessary copy of the encoded bytes: | ||
// - 1 copy in from file to tensor (in read_file()) | ||
// - 1 copy from tensor to GIFLIB buffers (in read_from_tensor()) | ||
// Since we're vendoring GIFLIB we can potentially modify the calls to | ||
// InternalRead() and just set the `buf` pointer to the tensor data directly. | ||
// That might even save allocation of those buffers. | ||
// If we do that, we'd have to make sure the buffers are never written to by | ||
// GIFLIB, otherwise we'd be overridding the tensor data. | ||
reader_helper_t reader_helper; | ||
reader_helper.encoded_data = encoded_data.data_ptr<uint8_t>(); | ||
reader_helper.encoded_data_size = encoded_data.numel(); | ||
reader_helper.num_bytes_read = 0; | ||
GifFileType* gifFile = | ||
DGifOpen(static_cast<void*>(&reader_helper), read_from_tensor, &error); | ||
|
||
TORCH_CHECK( | ||
(gifFile != nullptr) && (error == D_GIF_SUCCEEDED), | ||
"DGifOpenFileName() failed - ", | ||
error); | ||
|
||
if (DGifSlurp(gifFile) == GIF_ERROR) { | ||
auto gifFileError = gifFile->Error; | ||
DGifCloseFile(gifFile, &error); | ||
TORCH_CHECK(false, "DGifSlurp() failed - ", gifFileError); | ||
} | ||
auto num_images = gifFile->ImageCount; | ||
|
||
// This check should already done within DGifSlurp(), just to be safe | ||
TORCH_CHECK(num_images > 0, "GIF file should contain at least one image!"); | ||
|
||
// Note: | ||
// The GIF format has this notion of "canvas" and "canvas size", where each | ||
// image could be displayed on the canvas at different offsets, forming a | ||
// mosaic/picture wall like so: | ||
// | ||
// <--- canvas W ---> | ||
// ------------------------ ^ | ||
// | | | | | ||
// | img1 | img3 | | | ||
// | |------------| canvas H | ||
// |---------- | | | ||
// | img2 | img4 | | | ||
// | | | | | ||
// ------------------------ v | ||
// The GifLib docs indicate that this is mostly vestigial | ||
// (https://giflib.sourceforge.net/whatsinagif/bits_and_bytes.html), and | ||
// modern viewers ignore the canvas size as well as image offsets. Hence, | ||
// we're ignoring that too: | ||
// - We're ignoring the canvas width and height and assume that the shape of | ||
// the canvas and of all images is the shape of the first image. | ||
// - We're enforcing that all images have the same shape. | ||
// - Left and Top offsets of each image are ignored as well and assumed to be | ||
// 0. | ||
|
||
auto out_h = gifFile->SavedImages[0].ImageDesc.Height; | ||
auto out_w = gifFile->SavedImages[0].ImageDesc.Width; | ||
|
||
// We output a channels-last tensor for consistency with other image decoders. | ||
// Torchvision's resize tends to be is faster on uint8 channels-last tensors. | ||
auto options = torch::TensorOptions() | ||
.dtype(torch::kU8) | ||
.memory_format(torch::MemoryFormat::ChannelsLast); | ||
auto out = torch::empty( | ||
{int64_t(num_images), 3, int64_t(out_h), int64_t(out_w)}, options); | ||
auto out_a = out.accessor<uint8_t, 4>(); | ||
|
||
for (int i = 0; i < num_images; i++) { | ||
const SavedImage& img = gifFile->SavedImages[i]; | ||
const GifImageDesc& desc = img.ImageDesc; | ||
TORCH_CHECK( | ||
desc.Width == out_w && desc.Height == out_h, | ||
"All images in the gif should have the same dimensions."); | ||
|
||
const ColorMapObject* cmap = | ||
desc.ColorMap ? desc.ColorMap : gifFile->SColorMap; | ||
TORCH_CHECK( | ||
cmap != nullptr, | ||
"Global and local color maps are missing. This should never happen!"); | ||
|
||
for (int h = 0; h < desc.Height; h++) { | ||
for (int w = 0; w < desc.Width; w++) { | ||
auto c = img.RasterBits[h * desc.Width + w]; | ||
GifColorType rgb = cmap->Colors[c]; | ||
out_a[i][0][h][w] = rgb.Red; | ||
out_a[i][1][h][w] = rgb.Green; | ||
out_a[i][2][h][w] = rgb.Blue; | ||
} | ||
} | ||
} | ||
out = out.squeeze(0); // remove batch dim if there's only one image | ||
|
||
DGifCloseFile(gifFile, &error); | ||
TORCH_CHECK(error == D_GIF_SUCCEEDED, "DGifCloseFile() failed - ", error); | ||
|
||
return out; | ||
} | ||
|
||
} // namespace image | ||
} // namespace vision |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,12 @@ | ||
#pragma once | ||
|
||
#include <torch/types.h> | ||
|
||
namespace vision { | ||
namespace image { | ||
|
||
// Decodes a GIF from its encoded bytes.
//
// encoded_data tensor must be 1D uint8 and contiguous; the implementation
// checks these requirements and fails if they are not met.
//
// Returns a uint8 tensor of shape (num_images, 3, H, W), where H and W are the
// dimensions of the first image of the GIF. When the GIF holds a single image
// the leading dimension is squeezed and the result is (3, H, W).
C10_EXPORT torch::Tensor decode_gif(const torch::Tensor& encoded_data); | ||
|
||
} // namespace image | ||
} // namespace vision |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,28 @@ | ||
These files come from the GIFLIB project (https://giflib.sourceforge.net/) and | ||
are licensed under the MIT license. | ||
|
||
Some modifications have been made to the original files: | ||
- Remove use of "register" keyword in gifalloc.c for C++17 compatibility. | ||
- Declare loop variable i in DGifGetImageHeader as int instead of unsigned int. | ||
|
||
Below is the original license text from the COPYING file of the GIFLIB project: | ||
|
||
= MIT LICENSE | ||
|
||
Permission is hereby granted, free of charge, to any person obtaining a copy | ||
of this software and associated documentation files (the "Software"), to deal | ||
in the Software without restriction, including without limitation the rights | ||
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||
copies of the Software, and to permit persons to whom the Software is | ||
furnished to do so, subject to the following conditions: | ||
|
||
The above copyright notice and this permission notice shall be included in | ||
all copies or substantial portions of the Software. | ||
|
||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | ||
THE SOFTWARE. |
Oops, something went wrong.