wordbreakdef.h

Go to the documentation of this file.
00001 /* vim: set tabstop=4 shiftwidth=4: */
00002 
00003 /*
00004  * Word breaking in a Unicode sequence.  Designed to be used in a
00005  * generic text renderer.
00006  *
00007  * Copyright (C) 2012 Tom Hacohen <tom@stosb.com>
00008  *
00009  * This software is provided 'as-is', without any express or implied
00010  * warranty.  In no event will the author be held liable for any damages
00011  * arising from the use of this software.
00012  *
00013  * Permission is granted to anyone to use this software for any purpose,
00014  * including commercial applications, and to alter it and redistribute
00015  * it freely, subject to the following restrictions:
00016  *
00017  * 1. The origin of this software must not be misrepresented; you must
00018  *    not claim that you wrote the original software.  If you use this
00019  *    software in a product, an acknowledgement in the product
00020  *    documentation would be appreciated but is not required.
00021  * 2. Altered source versions must be plainly marked as such, and must
00022  *    not be misrepresented as being the original software.
00023  * 3. This notice may not be removed or altered from any source
00024  *    distribution.
00025  *
00026  * The main reference is Unicode Standard Annex 29 (UAX #29):
00027  *      <URL:http://unicode.org/reports/tr29>
00028  *
00029  * When this library was designed, this annex was at Revision 17, for
00030  * Unicode 6.0.0:
00031  *      <URL:http://www.unicode.org/reports/tr29/tr29-17.html>
00032  *
00033  * The Unicode Terms of Use are available at
00034  *      <URL:http://www.unicode.org/copyright.html>
00035  */
00036 
/*
 * Word-break classes used to label code points for word segmentation.
 *
 * The enumerator names match the Word_Break property values listed in
 * Unicode Standard Annex #29 (the annex cited in the file header); the
 * per-value notes below summarise that annex and are not derived from
 * code visible in this file.
 *
 * No explicit values are given, so the enumerators number consecutively
 * from WBP_Undefined == 0 to WBP_Any == 13.  Reordering or inserting
 * entries changes those values.
 */
00051 enum WordBreakClass
00052 {
00053    WBP_Undefined,      /* 0; NOTE(review): presumably "no class assigned" -- confirm against users */
00054    WBP_CR,             /* UAX #29 "CR" (carriage return) */
00055    WBP_LF,             /* UAX #29 "LF" (line feed) */
00056    WBP_Newline,        /* UAX #29 "Newline" (other line/paragraph separators) */
00057    WBP_Extend,         /* UAX #29 "Extend" (grapheme-extending marks) */
00058    WBP_Format,         /* UAX #29 "Format" (format control characters) */
00059    WBP_Katakana,       /* UAX #29 "Katakana" */
00060    WBP_ALetter,        /* UAX #29 "ALetter" (alphabetic letters) */
00061    WBP_MidNumLet,      /* UAX #29 "MidNumLet" (may occur inside both words and numbers) */
00062    WBP_MidLetter,      /* UAX #29 "MidLetter" (may occur inside words) */
00063    WBP_MidNum,         /* UAX #29 "MidNum" (may occur inside numbers) */
00064    WBP_Numeric,        /* UAX #29 "Numeric" (digits) */
00065    WBP_ExtendNumLet,   /* UAX #29 "ExtendNumLet" (connector punctuation) */
00066    WBP_Any             /* 13; NOTE(review): presumably the catch-all "Any" of UAX #29 -- confirm */
00067 };
00068 
/*
 * One entry associating a span of code points (start .. end) with a
 * word-break class.
 *
 * utf32_t is declared elsewhere in the project.
 * NOTE(review): the range is presumably inclusive at both ends, and a
 * table of these entries is presumably kept sorted by code point for
 * lookup -- confirm against the code that searches it.
 */
00073 struct WordBreakProperties
00074 {
00075     utf32_t start;              /* first code point of the span */
00076     utf32_t end;                /* last code point of the span (assumed inclusive -- TODO confirm) */
00077     enum WordBreakClass prop;   /* word-break class assigned to the span */
00078 };

Generated on Sat Aug 11 14:59:20 2012 for libunibreak by  doxygen 1.5.2