/*
    Copyright (C) 2018 Matthias P. Braendli (http://opendigitalradio.org)

    This program is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/
/*!
    \file charset.h
    \brief A converter for UTF-8 to EBU Latin charset according to
           ETSI TS 101 756 Annex C, used for DLS and Labels.

    \author Matthias P. Braendli
    \author Lindsay Cornell
*/

#pragma once

#include <cstdint>
#include <string>
#include <vector>
#include "utf8.h"

class CharsetConverter
{
    public:
        CharsetConverter();

        /*! Convert a UTF-8 encoded text line into an EBU Latin encoded byte
         *  stream. If up_to_first_error is set, convert as much text as possible.
         *  If false, raise an utf8::exception in case of conversion errors.
         */
        std::string convert(std::string line_utf8, bool up_to_first_error = true);

        /*! Convert a EBU Latin byte stream to a UTF-8 encoded string.
         *  Invalid input characters are converted to ⁇ (unicode U+2047).
         */
        std::string convert_ebu_to_utf8(const std::string& str);

    private:
        // Representation of the table in 32-bit unicode
        std::vector<uint32_t> m_conversion_table;
};