libosmscout 1.1.1
Loading...
Searching...
No Matches
utf8helper Namespace Reference

Classes

struct  Parser
 Parse and transform a UTF-8 string. More...
class  UTF8String
struct  character

Typedefs

using Transform = codepoint (*)(const character*, int context)
 Functor that implements the desired transformation of a character. It has 2 arguments:
using byte = uint8_t
using codepoint = uint32_t

Functions

std::string UTF8ToUpper (const std::string &text)
std::string UTF8ToLower (const std::string &text)
std::string UTF8Normalize (const std::string &text)
std::string UTF8Capitalize (const std::string &text)
std::string UTF8Transliterate (const std::string &text)
codepoint TransformNop (const character *, int)
codepoint TransformUpper (const character *, int)
codepoint TransformLower (const character *, int)
codepoint TransformCapitalize (const character *, int)
codepoint TransformNormalize (const character *, int)
codepoint TransformTransliterate (const character *, int)

Variables

constexpr int None = 0x00
constexpr int IsSpace = 0x01
constexpr int IsBreaker = 0x02
constexpr int IsControl = 0x04
constexpr int IsModifier = 0x08
constexpr int IsDiacritic = 0x10
constexpr int IsPunctuation = 0x20
constexpr codepoint NullCodepoint = 0
const character charmap_us7ascii []
const character * pagemap_16 [32]
const character charmap_c2 []
const character charmap_c3 []
const character charmap_c4 []
const character charmap_c5 []
const character charmap_c6 []
const character charmap_c7 []
const character charmap_c8 []
const character charmap_c9 []
const character charmap_ca []
const character charmap_cb []
const character charmap_cc []
const character charmap_cd []
const character charmap_ce []
const character charmap_cf []
const character charmap_d0 []
const character charmap_d1 []
const character charmap_d2 []
const character charmap_d3 []
const character charmap_d4 []
const character charmap_d5 []
const character charmap_d6 []
const character * pagemap_24_e1 []
const character charmap_e1_82 []
const character charmap_e1_83 []
const character charmap_e1_b8 []
const character charmap_e1_b9 []
const character charmap_e1_ba []
const character charmap_e1_bb []
const character charmap_e1_bc []
const character charmap_e1_bd []
const character charmap_e1_be []
const character charmap_e1_bf []
const character * pagemap_24_e2 []
const character charmap_e2_80 []
const character charmap_e2_81 []
const character charmap_e2_82 []
const character charmap_e2_b4 []
const character * pagemap_32_f0_90 []
const character charmap_f0_90_92 []
const character charmap_f0_90_93 []
const character * pagemap_32_f0_9e []
const character charmap_f0_9e_a4 []

Typedef Documentation

◆ byte

using utf8helper::byte = uint8_t

◆ codepoint

using utf8helper::codepoint = uint32_t

◆ Transform

using utf8helper::Transform = codepoint (*)(const character*, int context)

Functor that implements the desired transformation of a character. It has 2 arguments:

  • The character struct matching the current code point
  • The context, which is the category of the preceding sequence

It must return the new code point to be dumped instead, or NullCodepoint to discard the sequence.

Function Documentation

◆ TransformCapitalize()

codepoint utf8helper::TransformCapitalize ( const character * ,
int  )
extern

◆ TransformLower()

codepoint utf8helper::TransformLower ( const character * ,
int  )
extern

◆ TransformNop()

codepoint utf8helper::TransformNop ( const character * ,
int  )
extern

◆ TransformNormalize()

codepoint utf8helper::TransformNormalize ( const character * ,
int  )
extern

◆ TransformTransliterate()

codepoint utf8helper::TransformTransliterate ( const character * ,
int  )
extern

◆ TransformUpper()

codepoint utf8helper::TransformUpper ( const character * ,
int  )
extern

◆ UTF8Capitalize()

std::string utf8helper::UTF8Capitalize ( const std::string & text)
extern

◆ UTF8Normalize()

std::string utf8helper::UTF8Normalize ( const std::string & text)
extern

◆ UTF8ToLower()

std::string utf8helper::UTF8ToLower ( const std::string & text)
extern

◆ UTF8ToUpper()

std::string utf8helper::UTF8ToUpper ( const std::string & text)
extern

◆ UTF8Transliterate()

std::string utf8helper::UTF8Transliterate ( const std::string & text)
extern

Variable Documentation

◆ charmap_c2

const character utf8helper::charmap_c2[]
extern

◆ charmap_c3

const character utf8helper::charmap_c3[]
extern

◆ charmap_c4

const character utf8helper::charmap_c4[]
extern

◆ charmap_c5

const character utf8helper::charmap_c5[]
extern

◆ charmap_c6

const character utf8helper::charmap_c6[]
extern

◆ charmap_c7

const character utf8helper::charmap_c7[]
extern

◆ charmap_c8

const character utf8helper::charmap_c8[]
extern

◆ charmap_c9

const character utf8helper::charmap_c9[]
extern

◆ charmap_ca

const character utf8helper::charmap_ca[]
extern

◆ charmap_cb

const character utf8helper::charmap_cb[]
extern

◆ charmap_cc

const character utf8helper::charmap_cc[]
extern

◆ charmap_cd

const character utf8helper::charmap_cd[]
extern

◆ charmap_ce

const character utf8helper::charmap_ce[]
extern

◆ charmap_cf

const character utf8helper::charmap_cf[]
extern

◆ charmap_d0

const character utf8helper::charmap_d0[]
extern

◆ charmap_d1

const character utf8helper::charmap_d1[]
extern

◆ charmap_d2

const character utf8helper::charmap_d2[]
extern

◆ charmap_d3

const character utf8helper::charmap_d3[]
extern

◆ charmap_d4

const character utf8helper::charmap_d4[]
extern

◆ charmap_d5

const character utf8helper::charmap_d5[]
extern

◆ charmap_d6

const character utf8helper::charmap_d6[]
extern

◆ charmap_e1_82

const character utf8helper::charmap_e1_82[]
extern

◆ charmap_e1_83

const character utf8helper::charmap_e1_83[]
extern

◆ charmap_e1_b8

const character utf8helper::charmap_e1_b8[]
extern

◆ charmap_e1_b9

const character utf8helper::charmap_e1_b9[]
extern

◆ charmap_e1_ba

const character utf8helper::charmap_e1_ba[]
extern

◆ charmap_e1_bb

const character utf8helper::charmap_e1_bb[]
extern

◆ charmap_e1_bc

const character utf8helper::charmap_e1_bc[]
extern

◆ charmap_e1_bd

const character utf8helper::charmap_e1_bd[]
extern

◆ charmap_e1_be

const character utf8helper::charmap_e1_be[]
extern

◆ charmap_e1_bf

const character utf8helper::charmap_e1_bf[]
extern

◆ charmap_e2_80

const character utf8helper::charmap_e2_80[]
extern

◆ charmap_e2_81

const character utf8helper::charmap_e2_81[]
extern

◆ charmap_e2_82

const character utf8helper::charmap_e2_82[]
extern

◆ charmap_e2_b4

const character utf8helper::charmap_e2_b4[]
extern

◆ charmap_f0_90_92

const character utf8helper::charmap_f0_90_92[]
extern

◆ charmap_f0_90_93

const character utf8helper::charmap_f0_90_93[]
extern

◆ charmap_f0_9e_a4

const character utf8helper::charmap_f0_9e_a4[]
extern

◆ charmap_us7ascii

const character utf8helper::charmap_us7ascii[]
extern

◆ IsBreaker

int utf8helper::IsBreaker = 0x02
constexpr

◆ IsControl

int utf8helper::IsControl = 0x04
constexpr

◆ IsDiacritic

int utf8helper::IsDiacritic = 0x10
constexpr

◆ IsModifier

int utf8helper::IsModifier = 0x08
constexpr

◆ IsPunctuation

int utf8helper::IsPunctuation = 0x20
constexpr

◆ IsSpace

int utf8helper::IsSpace = 0x01
constexpr

◆ None

int utf8helper::None = 0x00
constexpr

◆ NullCodepoint

codepoint utf8helper::NullCodepoint = 0
constexpr

◆ pagemap_16

const character* utf8helper::pagemap_16[32]
extern

◆ pagemap_24_e1

const character* utf8helper::pagemap_24_e1[]
extern

◆ pagemap_24_e2

const character* utf8helper::pagemap_24_e2[]
extern

◆ pagemap_32_f0_90

const character* utf8helper::pagemap_32_f0_90[]
extern

◆ pagemap_32_f0_9e

const character* utf8helper::pagemap_32_f0_9e[]
extern