2018-12-31 20:04:05 +01:00
|
|
|
//
|
2022-12-31 22:28:08 +01:00
|
|
|
// Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2023
|
2018-12-31 20:04:05 +01:00
|
|
|
//
|
|
|
|
// Distributed under the Boost Software License, Version 1.0. (See accompanying
|
|
|
|
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
|
|
|
//
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include "td/utils/common.h"
|
|
|
|
|
|
|
|
namespace td {
|
|
|
|
|
|
|
|
/**
 * Simplified category of a unicode character, as returned by get_unicode_simple_category.
 * Enumerator order is significant: it determines the underlying integer values.
 */
enum class UnicodeSimpleCategory {
  Unknown,
  Letter,
  DecimalNumber,
  Number,
  Separator
};
|
|
|
|
|
|
|
|
/**
 * Returns the simplified category of the unicode character with the given code.
 * NOTE(review): which characters map to UnicodeSimpleCategory::Unknown is decided by the
 * implementation, which is not visible from this header.
 */
UnicodeSimpleCategory get_unicode_simple_category(uint32 code);
|
|
|
|
|
|
|
|
/**
 * Prepares a unicode character for search, leaving only digits and lowercased letters.
 * Returns the code of the replacement character, or 0 if the character should be skipped.
 */
|
|
|
|
uint32 prepare_search_character(uint32 code);
|
|
|
|
|
|
|
|
/**
 * Converts a unicode character to lower case.
 * Returns the code of the resulting character.
 * NOTE(review): presumably a character without a lower-case form is returned unchanged;
 * confirm against the implementation.
 */
|
|
|
|
uint32 unicode_to_lower(uint32 code);
|
|
|
|
|
2018-07-31 17:42:27 +02:00
|
|
|
/**
 * Removes diacritics from a unicode character.
 * Returns the code of the resulting character.
 * NOTE(review): presumably a character without diacritics is returned unchanged;
 * confirm against the implementation.
 */
|
|
|
|
uint32 remove_diacritics(uint32 code);
|
|
|
|
|
2018-12-31 20:04:05 +01:00
|
|
|
} // namespace td
|