// Source: ComputeLibrary/latest/_assets_library_8cpp_source.xhtml

/*

 * Copyright (c) 2017-2020, 2023 Arm Limited.

 *

 * SPDX-License-Identifier: MIT

 *

 * Permission is hereby granted, free of charge, to any person obtaining a copy

 * of this software and associated documentation files (the "Software"), to

 * deal in the Software without restriction, including without limitation the

 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

 * sell copies of the Software, and to permit persons to whom the Software is

 * furnished to do so, subject to the following conditions:

 *

 * The above copyright notice and this permission notice shall be included in all

 * copies or substantial portions of the Software.

 *

 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE

 * SOFTWARE.

 */

#include "tests/AssetsLibrary.h"


#include "Utils.h"

#include "utils/TypePrinter.h"


#include "arm_compute/core/ITensor.h"


#pragma GCC diagnostic push

#pragma GCC diagnostic ignored "-Wunused-parameter"

#include "libnpy/npy.hpp"

#pragma GCC diagnostic pop


#include <cctype>

#include <fstream>

#include <limits>

#include <map>

#include <mutex>

#include <sstream>

#include <stdexcept>

#include <tuple>

#include <unordered_map>

#include <utility>


namespace arm_compute

{

namespace test

{

namespace

{

/** Convert an interleaved 3-channel source image to a single-channel luminance image.
 *
 * Each destination element is the weighted sum 0.2126 * R + 0.7152 * G + 0.0722 * B of three
 * consecutive source bytes (these weights match the ITU-R BT.709 luma coefficients). The sum is
 * computed in floating point and implicitly converted to @p T when stored.
 *
 * @tparam T Integral type of the destination elements.
 *
 * @param[in]  src Source tensor, read as three consecutive bytes per element.
 * @param[out] dst Destination tensor, written as one @p T per element.
 */
template <typename T, typename std::enable_if<std::is_integral<T>::value, int>::type = 0>
void rgb_to_luminance(const RawTensor &src, RawTensor &dst)
{
    // Both images must describe the same number of pixels (regardless of element size or channel count)
    ARM_COMPUTE_ERROR_ON_MSG(src.num_elements() != dst.num_elements(), "Input and output images must have equal dimensions");

    // Currently, input is always RGB888 (3 U8 channels per element). Output can be U8, U16/S16 or U32
    const size_t pixel_count = dst.num_elements();
    const auto *rgb          = src.data();
    T          *luminance    = reinterpret_cast<T *>(dst.data());

    for(size_t px = 0; px < pixel_count; ++px)
    {
        // The R, G and B bytes of pixel px sit at offsets [0, 1, 2] from rgb + 3 * px
        const auto *channels = rgb + 3 * px;
        luminance[px]        = 0.2126f * channels[0] + 0.7152f * channels[1] + 0.0722f * channels[2];
    }
}


/** Copy the first byte of every 3-byte source element into the destination.
 *
 * @param[in]  src Interleaved source tensor; its size must be three times the destination size.
 * @param[out] dst Destination tensor receiving one byte per element.
 */
void extract_r_from_rgb(const RawTensor &src, RawTensor &dst)
{
    ARM_COMPUTE_ERROR_ON(src.size() != 3 * dst.size());

    const auto  *rgb   = src.data();
    auto        *plane = dst.data();
    const size_t count = dst.num_elements();

    for(size_t px = 0; px < count; ++px)
    {
        // Offset 0 inside each RGB triplet is the red channel
        plane[px] = rgb[3 * px];
    }
}


/** Copy the second byte of every 3-byte source element into the destination.
 *
 * @param[in]  src Interleaved source tensor; its size must be three times the destination size.
 * @param[out] dst Destination tensor receiving one byte per element.
 */
void extract_g_from_rgb(const RawTensor &src, RawTensor &dst)
{
    ARM_COMPUTE_ERROR_ON(src.size() != 3 * dst.size());

    const auto  *rgb   = src.data();
    auto        *plane = dst.data();
    const size_t count = dst.num_elements();

    for(size_t px = 0; px < count; ++px)
    {
        // Offset 1 inside each RGB triplet is the green channel
        plane[px] = rgb[3 * px + 1];
    }
}


/** Copy the third byte of every 3-byte source element into the destination.
 *
 * @param[in]  src Interleaved source tensor; its size must be three times the destination size.
 * @param[out] dst Destination tensor receiving one byte per element.
 */
void extract_b_from_rgb(const RawTensor &src, RawTensor &dst)
{
    ARM_COMPUTE_ERROR_ON(src.size() != 3 * dst.size());

    const auto  *rgb   = src.data();
    auto        *plane = dst.data();
    const size_t count = dst.num_elements();

    for(size_t px = 0; px < count; ++px)
    {
        // Offset 2 inside each RGB triplet is the blue channel
        plane[px] = rgb[3 * px + 2];
    }
}


/** Skip consecutive comment lines at the current read position.
 *
 * While the next character is '#', everything up to and including the following newline is consumed.
 *
 * @param[in,out] fs Stream to advance.
 */
void discard_comments(std::ifstream &fs)
{
    constexpr auto whole_line = std::numeric_limits<std::streamsize>::max();

    for(auto next = fs.peek(); next == '#'; next = fs.peek())
    {
        fs.ignore(whole_line, '\n');
    }
}


/** Skip any mix of comment lines and whitespace characters at the current read position.
 *
 * Stops at the first character that is neither whitespace nor the start of a comment line.
 *
 * @param[in,out] fs Stream to advance.
 */
void discard_comments_and_spaces(std::ifstream &fs)
{
    discard_comments(fs);

    while(isspace(fs.peek()) != 0)
    {
        // Drop one whitespace character, then re-check for comments that may follow it
        fs.ignore(1);
        discard_comments(fs);
    }
}


/** Parse the header of a binary Netpbm file ("P<number>" magic, width, height, maximum value).
 *
 * Comments and whitespace between the header fields are skipped. After the maximum value, any comment
 * lines are skipped and exactly one whitespace character is consumed, leaving the stream at the
 * position that follows the header.
 *
 * @param[in,out] fs     Stream positioned at the start of the file.
 * @param[in]     number Expected second character of the magic number (e.g. '6' or '5').
 *
 * @return Tuple of (width, height, maximum value).
 *
 * @throws std::runtime_error if the magic number differs, the fields cannot be read, the maximum
 *                            value is not 255, or the header is not terminated by whitespace.
 */
std::tuple<unsigned int, unsigned int, int> parse_netpbm_format_header(std::ifstream &fs, char number)
{
    // check file type magic number is valid
    char magic_letter = 0;
    char magic_digit  = 0;
    fs >> magic_letter >> magic_digit;

    const bool magic_matches = (magic_letter == 'P') && (magic_digit == number);
    if(!magic_matches)
    {
        throw std::runtime_error("File type magic number not supported");
    }

    unsigned int width     = 0;
    unsigned int height    = 0;
    int          max_value = 0;

    discard_comments_and_spaces(fs);
    fs >> width;

    discard_comments_and_spaces(fs);
    fs >> height;

    discard_comments_and_spaces(fs);
    fs >> max_value;

    // A single state check after the third field covers all three extractions
    if(!fs.good())
    {
        throw std::runtime_error("Cannot read image dimensions");
    }

    if(max_value != 255)
    {
        throw std::runtime_error("RawTensor doesn't have 8-bit values");
    }

    discard_comments(fs);

    // The header must be followed by one whitespace character
    if(isspace(fs.peek()) == 0)
    {
        throw std::runtime_error("Invalid image header");
    }
    fs.ignore(1);

    return std::make_tuple(width, height, max_value);
}


/** Parse a Netpbm header whose magic number is "P6".
 *
 * @param[in,out] fs Stream positioned at the start of the file.
 *
 * @return Tuple of (width, height, maximum value) as returned by parse_netpbm_format_header.
 */
std::tuple<unsigned int, unsigned int, int> parse_ppm_header(std::ifstream &fs)

{

    return parse_netpbm_format_header(fs, '6');

}


/** Parse a Netpbm header whose magic number is "P5".
 *
 * @param[in,out] fs Stream positioned at the start of the file.
 *
 * @return Tuple of (width, height, maximum value) as returned by parse_netpbm_format_header.
 */
std::tuple<unsigned int, unsigned int, int> parse_pgm_header(std::ifstream &fs)

{

    return parse_netpbm_format_header(fs, '5');

}


/** Verify that at least @p raw_size bytes remain between the current read position and the end of the file.
 *
 * The read position is moved to the end of the file to measure it and then restored.
 * Positions are kept as stream position types so that a failed query (reported as pos_type(-1))
 * is detected instead of being converted to a huge unsigned value.
 *
 * @param[in,out] fs       Stream to inspect.
 * @param[in]     raw_size Number of bytes that must still be available.
 *
 * @throws std::runtime_error if the stream position cannot be queried or restored, or if fewer
 *                            than @p raw_size bytes remain.
 */
void check_image_size(std::ifstream &fs, size_t raw_size)
{
    using pos_type = std::ifstream::pos_type;
    const pos_type invalid_position(std::streamoff(-1));

    const pos_type current_position = fs.tellg();
    if(current_position == invalid_position)
    {
        throw std::runtime_error("Cannot query current position in file");
    }

    fs.seekg(0, std::ios_base::end);
    const pos_type end_position = fs.tellg();
    fs.seekg(current_position);

    if(end_position == invalid_position || fs.fail())
    {
        throw std::runtime_error("Cannot determine file size");
    }

    // Signed difference: a negative value can no longer wrap around to a large unsigned count
    const std::streamoff remaining = end_position - current_position;
    if(remaining < 0 || static_cast<unsigned long long>(remaining) < raw_size)
    {
        throw std::runtime_error("Not enough data in file");
    }
}


/** Read raw.size() characters from the stream directly into the tensor's buffer.
 *
 * @param[in,out] fs  Stream positioned at the start of the pixel data.
 * @param[out]    raw Tensor whose buffer is filled.
 *
 * @throws std::runtime_error if the stream is not in a good state after the read.
 */
void read_image_buffer(std::ifstream &fs, RawTensor &raw)
{
    auto *buffer = reinterpret_cast<std::fstream::char_type *>(raw.data());
    fs.read(buffer, raw.size());

    if(fs.good())
    {
        return;
    }

    throw std::runtime_error("Failure while reading image buffer");
}


/** Load a PPM file into an RGB888 tensor of shape (width, height).
 *
 * @param[in] path Path of the file to open in binary mode.
 *
 * @return Tensor holding the image data read from the file.
 *
 * @throws framework::FileNotFound if the file cannot be opened.
 * @throws std::runtime_error      if the header is invalid or the file holds too little data.
 */
RawTensor load_ppm(const std::string &path)
{
    std::ifstream stream(path, std::ios::in | std::ios::binary);

    if(!stream.good())
    {
        throw framework::FileNotFound("Could not load PPM image: " + path);
    }

    // The maximum value (third tuple element) is validated by the parser and not needed here
    const auto         header = parse_ppm_header(stream);
    const unsigned int width  = std::get<0>(header);
    const unsigned int height = std::get<1>(header);

    RawTensor image(TensorShape(width, height), Format::RGB888);

    check_image_size(stream, image.size());
    read_image_buffer(stream, image);

    return image;
}


/** Load a PGM file into a U8 tensor of shape (width, height).
 *
 * @param[in] path Path of the file to open in binary mode.
 *
 * @return Tensor holding the image data read from the file.
 *
 * @throws framework::FileNotFound if the file cannot be opened.
 * @throws std::runtime_error      if the header is invalid or the file holds too little data.
 */
RawTensor load_pgm(const std::string &path)
{
    std::ifstream stream(path, std::ios::in | std::ios::binary);

    if(!stream.good())
    {
        throw framework::FileNotFound("Could not load PGM image: " + path);
    }

    // The maximum value (third tuple element) is validated by the parser and not needed here
    const auto         header = parse_pgm_header(stream);
    const unsigned int width  = std::get<0>(header);
    const unsigned int height = std::get<1>(header);

    RawTensor image(TensorShape(width, height), Format::U8);

    check_image_size(stream, image.size());
    read_image_buffer(stream, image);

    return image;
}

} // namespace


/** Construct a library that stores the given root path and seed.
 *
 * @param[in] path Root path of the assets; moved into the library.
 * @param[in] seed Seed value stored in the library.
 */
AssetsLibrary::AssetsLibrary(std::string path, std::random_device::result_type seed) //NOLINT

    : _library_path(std::move(path)),

      _seed{ seed }

{

}


/** @return A copy of the root path the library was constructed with. */
std::string AssetsLibrary::path() const

{

    return _library_path;

}


/** @return The seed the library was constructed with. */
std::random_device::result_type AssetsLibrary::seed() const

{

    return _seed;

}


/** Fill a tensor with the leading raw.size() elements of the named image in the given format.
 *
 * @param[out] raw    Tensor to fill; it must not be larger than the source image.
 * @param[in]  name   Name of the image to fetch through get().
 * @param[in]  format Format the image is requested in.
 */
void AssetsLibrary::fill(RawTensor &raw, const std::string &name, Format format) const
{
    //FIXME: Should be done by swapping cached buffers
    const RawTensor &src = get(name, format);

    // copy_n reads raw.size() elements from src, so a larger destination would read past the end
    // of the source buffer. NOTE(review): the macro is presumably active only in assert-enabled builds.
    ARM_COMPUTE_ERROR_ON_MSG(raw.size() > src.size(), "Destination tensor is larger than the source image");

    std::copy_n(src.data(), raw.size(), raw.data());
}


/** Fill a tensor with one channel of the named image.
 *
 * The image format is taken from get_format_for_channel(channel) and the call is forwarded to
 * the (format, channel) overload.
 *
 * @param[out] raw     Tensor to fill.
 * @param[in]  name    Name of the image.
 * @param[in]  channel Channel to use.
 */
void AssetsLibrary::fill(RawTensor &raw, const std::string &name, Channel channel) const

{

    fill(raw, name, get_format_for_channel(channel), channel);

}


/** Fill a tensor with the leading raw.size() elements of one channel of the named image.
 *
 * @param[out] raw     Tensor to fill; it must not be larger than the extracted channel.
 * @param[in]  name    Name of the image to fetch through get().
 * @param[in]  format  Format the image is requested in.
 * @param[in]  channel Channel to use.
 */
void AssetsLibrary::fill(RawTensor &raw, const std::string &name, Format format, Channel channel) const
{
    const RawTensor &src = get(name, format, channel);

    // copy_n reads raw.size() elements from src, so a larger destination would read past the end
    // of the source buffer. NOTE(review): the macro is presumably active only in assert-enabled builds.
    ARM_COMPUTE_ERROR_ON_MSG(raw.size() > src.size(), "Destination tensor is larger than the source channel");

    std::copy_n(src.data(), raw.size(), raw.data());
}


/** Look up the loader registered for a file extension.
 *
 * Only the extensions "ppm" and "pgm" are registered; the lookup is an exact string match.
 *
 * @param[in] extension File extension without the leading dot.
 *
 * @return Reference to the matching loader stored in a function-local static table.
 *
 * @throws std::invalid_argument if no loader is registered for @p extension.
 */
const AssetsLibrary::Loader &AssetsLibrary::get_loader(const std::string &extension) const
{
    static const std::unordered_map<std::string, Loader> known_loaders =
    {
        { "ppm", load_ppm },
        { "pgm", load_pgm }
    };

    const auto match = known_loaders.find(extension);

    if(match == known_loaders.end())
    {
        throw std::invalid_argument("Cannot load image with extension '" + extension + "'");
    }

    return match->second;
}


/** Look up the converter between two formats.
 *
 * Registered conversions: RGB888 to U8, U16, S16 and U32 (all via rgb_to_luminance).
 *
 * @param[in] src Source format.
 * @param[in] dst Destination format.
 *
 * @return Reference to the matching converter stored in a function-local static table.
 *
 * @throws std::invalid_argument if no converter is registered for the pair.
 */
const AssetsLibrary::Converter &AssetsLibrary::get_converter(Format src, Format dst) const
{
    static const std::map<std::pair<Format, Format>, Converter> known_converters =
    {
        { std::make_pair(Format::RGB888, Format::U8), rgb_to_luminance<uint8_t> },
        { std::make_pair(Format::RGB888, Format::U16), rgb_to_luminance<uint16_t> },
        { std::make_pair(Format::RGB888, Format::S16), rgb_to_luminance<int16_t> },
        { std::make_pair(Format::RGB888, Format::U32), rgb_to_luminance<uint32_t> }
    };

    const auto match = known_converters.find(std::make_pair(src, dst));

    if(match == known_converters.end())
    {
        std::ostringstream description;
        description << "Cannot convert from format '" << src << "' to format '" << dst << "'\n";
        throw std::invalid_argument(description.str());
    }

    return match->second;
}


/** Look up the converter from a data type to a format.
 *
 * The table is currently empty, so every lookup ends in the exception below.
 *
 * @param[in] src Source data type.
 * @param[in] dst Destination format.
 *
 * @return Reference to the matching converter stored in a function-local static table.
 *
 * @throws std::invalid_argument if no converter is registered for the pair.
 */
const AssetsLibrary::Converter &AssetsLibrary::get_converter(DataType src, Format dst) const
{
    static const std::map<std::pair<DataType, Format>, Converter> known_converters = {};

    const auto match = known_converters.find(std::make_pair(src, dst));

    if(match == known_converters.end())
    {
        std::ostringstream description;
        description << "Cannot convert from data type '" << src << "' to format '" << dst << "'\n";
        throw std::invalid_argument(description.str());
    }

    return match->second;
}


/** Look up the converter between two data types.
 *
 * The table is currently empty, so every lookup ends in the exception below.
 *
 * @param[in] src Source data type.
 * @param[in] dst Destination data type.
 *
 * @return Reference to the matching converter stored in a function-local static table.
 *
 * @throws std::invalid_argument if no converter is registered for the pair.
 */
const AssetsLibrary::Converter &AssetsLibrary::get_converter(DataType src, DataType dst) const
{
    static const std::map<std::pair<DataType, DataType>, Converter> known_converters = {};

    const auto match = known_converters.find(std::make_pair(src, dst));

    if(match == known_converters.end())
    {
        std::ostringstream description;
        description << "Cannot convert from data type '" << src << "' to data type '" << dst << "'\n";
        throw std::invalid_argument(description.str());
    }

    return match->second;
}


/** Look up the converter from a format to a data type.
 *
 * The table is currently empty, so every lookup ends in the exception below.
 *
 * @param[in] src Source format.
 * @param[in] dst Destination data type.
 *
 * @return Reference to the matching converter stored in a function-local static table.
 *
 * @throws std::invalid_argument if no converter is registered for the pair.
 */
const AssetsLibrary::Converter &AssetsLibrary::get_converter(Format src, DataType dst) const
{
    static const std::map<std::pair<Format, DataType>, Converter> known_converters = {};

    const auto match = known_converters.find(std::make_pair(src, dst));

    if(match == known_converters.end())
    {
        std::ostringstream description;
        description << "Cannot convert from format '" << src << "' to data type '" << dst << "'\n";
        throw std::invalid_argument(description.str());
    }

    return match->second;
}


/** Look up the function that extracts one channel from a given format.
 *
 * Registered extractions: channels R, G and B of RGB888.
 *
 * @param[in] format  Format of the source image.
 * @param[in] channel Channel to extract.
 *
 * @return Reference to the matching extractor stored in a function-local static table.
 *
 * @throws std::invalid_argument if no extractor is registered for the pair.
 */
const AssetsLibrary::Extractor &AssetsLibrary::get_extractor(Format format, Channel channel) const
{
    static const std::map<std::pair<Format, Channel>, Extractor> known_extractors =
    {
        { std::make_pair(Format::RGB888, Channel::R), extract_r_from_rgb },
        { std::make_pair(Format::RGB888, Channel::G), extract_g_from_rgb },
        { std::make_pair(Format::RGB888, Channel::B), extract_b_from_rgb }
    };

    const auto match = known_extractors.find(std::make_pair(format, channel));

    if(match == known_extractors.end())
    {
        std::ostringstream description;
        description << "Cannot extract channel '" << channel << "' from format '" << format << "'\n";
        throw std::invalid_argument(description.str());
    }

    return match->second;
}


/** Load an image from the "images" directory below the library path.
 *
 * The loader is selected from the text after the last '.' of the full path. If the path contains
 * no '.', the whole path is used as the extension and get_loader() rejects it.
 *
 * @param[in] name File name of the image, including its extension.
 *
 * @return Tensor produced by the loader registered for the extension.
 *
 * @throws std::invalid_argument if no loader is registered for the extension.
 */
RawTensor AssetsLibrary::load_image(const std::string &name) const
{
#ifdef _WIN32
    const std::string images_dir("\\images\\");
#else  /* _WIN32 */
    const std::string images_dir("/images/");
#endif /* _WIN32 */

    const std::string full_path = _library_path + images_dir + name;

    // npos + 1 wraps to 0, so a path without any '.' yields the whole path here
    const auto        last_dot = full_path.find_last_of('.');
    const std::string suffix   = full_path.substr(last_dot + 1);

    const auto &loader = get_loader(suffix);
    return (*loader)(full_path);
}


/** Return the cached tensor for (name, format), loading and converting the image on a cache miss.
 *
 * The whole operation runs while holding _format_lock.
 *
 * @param[in] name   Name of the image.
 * @param[in] format Requested format.
 *
 * @return Reference to the tensor stored in the cache.
 */
const RawTensor &AssetsLibrary::find_or_create_raw_tensor(const std::string &name, Format format) const
{
    std::lock_guard<arm_compute::Mutex> guard(_format_lock);

    if(const RawTensor *cached = _cache.find(std::forward_as_tuple(name, format)))
    {
        return *cached;
    }

    RawTensor image = load_image(name);

    const auto loaded_format = image.format();
    if(loaded_format != format)
    {
        //FIXME: Remove unnecessary copy
        RawTensor   converted(image.shape(), format);
        const auto &convert = get_converter(loaded_format, format);
        (*convert)(image, converted);
        image = std::move(converted);
    }

    return _cache.add(std::forward_as_tuple(name, format), std::move(image));
}


/** Return the cached tensor for (name, format, channel), extracting the channel on a cache miss.
 *
 * The whole operation runs while holding _channel_lock. The source image is obtained through
 * get(name, format).
 *
 * @param[in] name    Name of the image.
 * @param[in] format  Format of the source image.
 * @param[in] channel Channel to extract.
 *
 * @return Reference to the tensor stored in the cache.
 */
const RawTensor &AssetsLibrary::find_or_create_raw_tensor(const std::string &name, Format format, Channel channel) const
{
    std::lock_guard<arm_compute::Mutex> guard(_channel_lock);

    if(const RawTensor *cached = _cache.find(std::forward_as_tuple(name, format, channel)))
    {
        return *cached;
    }

    const RawTensor &image = get(name, format);

    //FIXME: Need to change shape to match channel
    RawTensor plane(image.shape(), get_channel_format(channel));

    const auto &extract = get_extractor(format, channel);
    (*extract)(image, plane);

    return _cache.add(std::forward_as_tuple(name, format, channel), std::move(plane));
}


/** Return the shape of the named image.
 *
 * The image is loaded through load_image() on every call; only its shape is returned.
 *
 * @param[in] name File name of the image.
 *
 * @return Shape of the loaded image.
 */
TensorShape AssetsLibrary::get_image_shape(const std::string &name)

{

    return load_image(name).shape();

}


/** Get a reference to the cached tensor of the named image in RGB888 format.
 *
 * @param[in] name Name of the image.
 *
 * @return Reference to the tensor returned by find_or_create_raw_tensor().
 */
const RawTensor &AssetsLibrary::get(const std::string &name) const

{

    //FIXME: Format should be derived from the image name. Not be fixed to RGB.

    return find_or_create_raw_tensor(name, Format::RGB888);

}


/** Get a copy of the tensor of the named image in RGB888 format.
 *
 * @param[in] name Name of the image.
 *
 * @return New RawTensor copy-constructed from the tensor returned by find_or_create_raw_tensor().
 */
RawTensor AssetsLibrary::get(const std::string &name)

{

    //FIXME: Format should be derived from the image name. Not be fixed to RGB.

    return RawTensor(find_or_create_raw_tensor(name, Format::RGB888));

}


/** Create a tensor that has the shape of the named image but the given data type and channel count.
 *
 * Only the shape of the image is passed to the new tensor's constructor; no pixel data is passed.
 *
 * @param[in] name         Name of the image whose shape is used.
 * @param[in] data_type    Data type of the new tensor.
 * @param[in] num_channels Number of channels of the new tensor.
 *
 * @return Newly constructed tensor.
 */
RawTensor AssetsLibrary::get(const std::string &name, DataType data_type, int num_channels) const

{

    const RawTensor &raw = get(name);


    return RawTensor(raw.shape(), data_type, num_channels);

}


/** Get a reference to the cached tensor of the named image in the given format.
 *
 * @param[in] name   Name of the image.
 * @param[in] format Requested format.
 *
 * @return Reference to the tensor returned by find_or_create_raw_tensor().
 */
const RawTensor &AssetsLibrary::get(const std::string &name, Format format) const

{

    return find_or_create_raw_tensor(name, format);

}


/** Get a copy of the tensor of the named image in the given format.
 *
 * @param[in] name   Name of the image.
 * @param[in] format Requested format.
 *
 * @return New RawTensor copy-constructed from the tensor returned by find_or_create_raw_tensor().
 */
RawTensor AssetsLibrary::get(const std::string &name, Format format)

{

    return RawTensor(find_or_create_raw_tensor(name, format));

}


/** Get a reference to the tensor holding one channel of the named image.
 *
 * The image format is taken from get_format_for_channel(channel).
 *
 * @param[in] name    Name of the image.
 * @param[in] channel Requested channel.
 *
 * @return Reference returned by the (name, format, channel) overload.
 */
const RawTensor &AssetsLibrary::get(const std::string &name, Channel channel) const

{

    return get(name, get_format_for_channel(channel), channel);

}


/** Get a copy of the tensor holding one channel of the named image.
 *
 * The image format is taken from get_format_for_channel(channel).
 *
 * @param[in] name    Name of the image.
 * @param[in] channel Requested channel.
 *
 * @return New RawTensor constructed from the result of the (name, format, channel) overload.
 */
RawTensor AssetsLibrary::get(const std::string &name, Channel channel)

{

    return RawTensor(get(name, get_format_for_channel(channel), channel));

}


/** Get a reference to the cached tensor holding one channel of the named image in the given format.
 *
 * @param[in] name    Name of the image.
 * @param[in] format  Format of the source image.
 * @param[in] channel Requested channel.
 *
 * @return Reference to the tensor returned by find_or_create_raw_tensor().
 */
const RawTensor &AssetsLibrary::get(const std::string &name, Format format, Channel channel) const

{

    return find_or_create_raw_tensor(name, format, channel);

}


/** Get a copy of the tensor holding one channel of the named image in the given format.
 *
 * @param[in] name    Name of the image.
 * @param[in] format  Format of the source image.
 * @param[in] channel Requested channel.
 *
 * @return New RawTensor copy-constructed from the tensor returned by find_or_create_raw_tensor().
 */
RawTensor AssetsLibrary::get(const std::string &name, Format format, Channel channel)

{

    return RawTensor(find_or_create_raw_tensor(name, format, channel));

}


namespace detail

{

inline void validate_npy_header(std::ifstream &stream, const std::string &expect_typestr, const TensorShape &expect_shape)

{

    ARM_COMPUTE_UNUSED(expect_typestr);

    ARM_COMPUTE_UNUSED(expect_shape);


    std::string header_s = npy::read_header(stream);


    // Parse header

    npy::header_t header = npy::parse_header(header_s);


    std::vector<unsigned long> shape         = header.shape;

    bool                       fortran_order = header.fortran_order;

    std::string                typestr       = header.dtype.str();


    // Check if the typestring matches the given one

    ARM_COMPUTE_ERROR_ON_MSG(typestr != expect_typestr, "Typestrings mismatch");


    // Validate tensor shape

    ARM_COMPUTE_ERROR_ON_MSG(shape.size() != expect_shape.num_dimensions(), "Tensor ranks mismatch");

    if(fortran_order)

    {

        for(size_t i = 0; i < shape.size(); ++i)

        {

            ARM_COMPUTE_ERROR_ON_MSG(expect_shape[i] != shape[i], "Tensor dimensions mismatch");

        }

    }

    else

    {

        for(size_t i = 0; i < shape.size(); ++i)

        {

            ARM_COMPUTE_ERROR_ON_MSG(expect_shape[i] != shape[shape.size() - i - 1], "Tensor dimensions mismatch");

        }

    }

}

} // namespace detail

} // namespace test

} // namespace arm_compute