blob: 8476ee7f5db7efbfccdcf49b02c049b14e81dbeb (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
|
/*
Copyright (C) 2018 Matthias P. Braendli (http://opendigitalradio.org)
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
/*!
\file charset.h
\brief A converter for UTF-8 to EBU Latin charset according to
ETSI TS 101 756 Annex C, used for DLS and Labels.
\author Matthias P. Braendli
\author Lindsay Cornell
*/
#pragma once
#include <cstdint>
#include <string>
#include <vector>
#include "utf8.h"
class CharsetConverter
{
public:
CharsetConverter();
/*! Convert a UTF-8 encoded text line into an EBU Latin encoded byte
* stream. If up_to_first_error is set, convert as much text as possible.
* If false, raise an utf8::exception in case of conversion errors.
*/
std::string convert(std::string line_utf8, bool up_to_first_error = true);
/*! Convert a EBU Latin byte stream to a UTF-8 encoded string.
* Invalid input characters are converted to ⁇ (unicode U+2047).
*/
std::string convert_ebu_to_utf8(const std::string& str);
private:
// Representation of the table in 32-bit unicode
std::vector<uint32_t> m_conversion_table;
};
|