88 lines
2.8 KiB

/* vim: set tabstop=4 shiftwidth=4: */
/*
 * Line breaking in a Unicode sequence.  Designed to be used in a
 * generic text renderer.
 *
 * Copyright (C) 2008-2010 Wu Yongwei <wuyongwei at gmail dot com>
 *
 * This software is provided 'as-is', without any express or implied
 * warranty.  In no event will the author be held liable for any damages
 * arising from the use of this software.
 *
 * Permission is granted to anyone to use this software for any purpose,
 * including commercial applications, and to alter it and redistribute
 * it freely, subject to the following restrictions:
 *
 * 1. The origin of this software must not be misrepresented; you must
 *    not claim that you wrote the original software.  If you use this
 *    software in a product, an acknowledgement in the product
 *    documentation would be appreciated but is not required.
 * 2. Altered source versions must be plainly marked as such, and must
 *    not be misrepresented as being the original software.
 * 3. This notice may not be removed or altered from any source
 *    distribution.
 *
 * The main reference is Unicode Standard Annex 14 (UAX #14):
 *      <URL:http://www.unicode.org/reports/tr14/>
 *
 * When this library was designed, this annex was at Revision 19, for
 * Unicode 5.0.0:
 *      <URL:http://www.unicode.org/reports/tr14/tr14-19.html>
 *
 * This library has been updated according to Revision 24, for
 * Unicode 5.2.0:
 *      <URL:http://www.unicode.org/reports/tr14/tr14-24.html>
 *
 * The Unicode Terms of Use are available at
 *      <URL:http://www.unicode.org/copyright.html>
 */
/**
 * @file    linebreak.h
 *
 * Header file for the line breaking algorithm.
 *
 * @version 2.0, 2010/01/03
 * @author  Wu Yongwei
 */
#ifndef LINEBREAK_H
#define LINEBREAK_H

#include <stddef.h>

/* Give the declarations C linkage when this header is included from C++. */
#ifdef __cplusplus
extern "C" {
#endif

#define LINEBREAK_VERSION 0x0200 /**< Version of the library linebreak */

/**
 * Version of the library as an object with external linkage.  It is only
 * declared here; the definition lives in another translation unit.
 * NOTE(review): presumably holds LINEBREAK_VERSION as seen when the library
 * itself was built -- confirm against the defining source file.
 */
extern const int linebreak_version;

typedef unsigned char utf8_t;   /**< Type for UTF-8 data points */
typedef unsigned short utf16_t; /**< Type for UTF-16 data points */
typedef unsigned int utf32_t;   /**< Type for UTF-32 data points */

#define LINEBREAK_MUSTBREAK 0   /**< Break is mandatory */
#define LINEBREAK_ALLOWBREAK 1  /**< Break is allowed */
#define LINEBREAK_NOBREAK 2     /**< No break is possible */
#define LINEBREAK_INSIDEACHAR 3 /**< A UTF-8/16 sequence is unfinished */

/**
 * Initializes the line breaking library.
 *
 * NOTE(review): the implementation is not part of this header; presumably
 * this has to be called before any of the functions below -- confirm.
 */
void init_linebreak(void);

/**
 * Sets the line breaking information for a UTF-8 input string.
 *
 * The implementation is not part of this header; the parameter notes are
 * inferred from the names and types and should be confirmed against it.
 *
 * @param s     input UTF-8 string
 * @param len   length of the input (presumably counted in utf8_t units)
 * @param lang  language of the input (accepted values are not visible here)
 * @param brks  output buffer for the breaking data; presumably receives
 *              LINEBREAK_* values, one per unit of @a s -- TODO confirm
 */
void set_linebreaks_utf8(
        const utf8_t *s, size_t len, const char *lang, char *brks);

/**
 * Sets the line breaking information for a UTF-16 input string.
 *
 * The implementation is not part of this header; the parameter notes are
 * inferred from the names and types and should be confirmed against it.
 *
 * @param s     input UTF-16 string
 * @param len   length of the input (presumably counted in utf16_t units)
 * @param lang  language of the input (accepted values are not visible here)
 * @param brks  output buffer for the breaking data; presumably receives
 *              LINEBREAK_* values, one per unit of @a s -- TODO confirm
 */
void set_linebreaks_utf16(
        const utf16_t *s, size_t len, const char *lang, char *brks);

/**
 * Sets the line breaking information for a UTF-32 input string.
 *
 * The implementation is not part of this header; the parameter notes are
 * inferred from the names and types and should be confirmed against it.
 *
 * @param s     input UTF-32 string
 * @param len   length of the input (presumably counted in utf32_t units)
 * @param lang  language of the input (accepted values are not visible here)
 * @param brks  output buffer for the breaking data; presumably receives
 *              LINEBREAK_* values, one per unit of @a s -- TODO confirm
 */
void set_linebreaks_utf32(
        const utf32_t *s, size_t len, const char *lang, char *brks);

/**
 * Tells whether a line break can occur between two Unicode characters.
 *
 * @param char1  the first Unicode character
 * @param char2  the second Unicode character
 * @param lang   language of the input (accepted values are not visible here)
 * @return       an int; presumably one of the LINEBREAK_* values above --
 *               confirm against the implementation
 */
int is_line_breakable(utf32_t char1, utf32_t char2, const char *lang);

#ifdef __cplusplus
}
#endif

#endif /* LINEBREAK_H */