blob: ac6a37ea966d8789d1b6ba55f7c45d28bdbc07fc [file] [log] [blame]
/* ctype-style APIs.
*
* Copyright (C) 2012-2018 Reece H. Dunn
*
* This file is part of ucd-tools.
*
* ucd-tools is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* ucd-tools is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with ucd-tools. If not, see <http://www.gnu.org/licenses/>.
*/
#include "ucd/ucd.h"
int ucd_isalnum(codepoint_t c)
{
ucd_category cat = ucd_lookup_category(c);
switch (cat)
{
case UCD_CATEGORY_Lu:
case UCD_CATEGORY_Ll:
case UCD_CATEGORY_Lt:
case UCD_CATEGORY_Lm:
case UCD_CATEGORY_Lo:
case UCD_CATEGORY_Nl:
case UCD_CATEGORY_Nd:
case UCD_CATEGORY_No:
return 1;
case UCD_CATEGORY_Mn:
case UCD_CATEGORY_Mc:
case UCD_CATEGORY_So:
return (ucd_properties(c, cat) & UCD_PROPERTY_OTHER_ALPHABETIC) == UCD_PROPERTY_OTHER_ALPHABETIC;
default:
return 0;
}
}
int ucd_isalpha(codepoint_t c)
{
ucd_category cat = ucd_lookup_category(c);
switch (cat)
{
case UCD_CATEGORY_Lu:
case UCD_CATEGORY_Ll:
case UCD_CATEGORY_Lt:
case UCD_CATEGORY_Lm:
case UCD_CATEGORY_Lo:
case UCD_CATEGORY_Nl:
return 1;
case UCD_CATEGORY_Mn:
case UCD_CATEGORY_Mc:
case UCD_CATEGORY_So:
return (ucd_properties(c, cat) & UCD_PROPERTY_OTHER_ALPHABETIC) == UCD_PROPERTY_OTHER_ALPHABETIC;
default:
return 0;
}
}
int ucd_isblank(codepoint_t c)
{
switch (ucd_lookup_category(c))
{
case UCD_CATEGORY_Zs:
switch (c) /* Exclude characters with the <noBreak> DispositionType */
{
case 0x00A0: /* U+00A0 : NO-BREAK SPACE */
case 0x2007: /* U+2007 : FIGURE SPACE */
case 0x202F: /* U+202F : NARROW NO-BREAK SPACE */
return 0;
}
return 1;
case UCD_CATEGORY_Cc:
return c == 0x09; /* U+0009 : CHARACTER TABULATION */
default:
return 0;
}
}
int ucd_iscntrl(codepoint_t c)
{
return ucd_lookup_category(c) == UCD_CATEGORY_Cc;
}
int ucd_isdigit(codepoint_t c)
{
return (c >= 0x30 && c <= 0x39); /* [0-9] */
}
int ucd_isgraph(codepoint_t c)
{
switch (ucd_lookup_category(c))
{
case UCD_CATEGORY_Cc:
case UCD_CATEGORY_Cf:
case UCD_CATEGORY_Cn:
case UCD_CATEGORY_Co:
case UCD_CATEGORY_Cs:
case UCD_CATEGORY_Zl:
case UCD_CATEGORY_Zp:
case UCD_CATEGORY_Zs:
case UCD_CATEGORY_Ii:
return 0;
default:
return 1;
}
}
int ucd_islower(codepoint_t c)
{
ucd_category cat = ucd_lookup_category(c);
switch (cat)
{
case UCD_CATEGORY_Ll:
return 1;
case UCD_CATEGORY_Lt:
return ucd_toupper(c) != c;
case UCD_CATEGORY_Lm:
case UCD_CATEGORY_Lo:
case UCD_CATEGORY_Mn:
case UCD_CATEGORY_Nl:
case UCD_CATEGORY_So:
return (ucd_properties(c, cat) & UCD_PROPERTY_OTHER_LOWERCASE) == UCD_PROPERTY_OTHER_LOWERCASE;
default:
return 0;
}
}
int ucd_isprint(codepoint_t c)
{
switch (ucd_lookup_category(c))
{
case UCD_CATEGORY_Cc:
case UCD_CATEGORY_Cf:
case UCD_CATEGORY_Cn:
case UCD_CATEGORY_Co:
case UCD_CATEGORY_Cs:
case UCD_CATEGORY_Ii:
return 0;
default:
return 1;
}
}
int ucd_ispunct(codepoint_t c)
{
return ucd_isgraph(c) && !ucd_isalnum(c);
}
int ucd_isspace(codepoint_t c)
{
switch (ucd_lookup_category(c))
{
case UCD_CATEGORY_Zl:
case UCD_CATEGORY_Zp:
return 1;
case UCD_CATEGORY_Zs:
switch (c) /* Exclude characters with the <noBreak> DispositionType */
{
case 0x00A0: /* U+00A0 : NO-BREAK SPACE */
case 0x2007: /* U+2007 : FIGURE SPACE */
case 0x202F: /* U+202F : NARROW NO-BREAK SPACE */
return 0;
}
return 1;
case UCD_CATEGORY_Cc:
switch (c) /* Include control characters marked as White_Space */
{
case 0x09: /* U+0009 : CHARACTER TABULATION */
case 0x0A: /* U+000A : LINE FEED */
case 0x0B: /* U+000B : LINE TABULATION */
case 0x0C: /* U+000C : FORM FEED */
case 0x0D: /* U+000D : CARRIAGE RETURN */
case 0x85: /* U+0085 : NEXT LINE */
return 1;
}
default:
return 0;
}
}
int ucd_isupper(codepoint_t c)
{
ucd_category cat = ucd_lookup_category(c);
switch (cat)
{
case UCD_CATEGORY_Lu:
return 1;
case UCD_CATEGORY_Lt:
return ucd_tolower(c) != c;
case UCD_CATEGORY_Nl:
case UCD_CATEGORY_So:
return (ucd_properties(c, cat) & UCD_PROPERTY_OTHER_UPPERCASE) == UCD_PROPERTY_OTHER_UPPERCASE;
default:
return 0;
}
}
int ucd_isxdigit(codepoint_t c)
{
return (c >= 0x30 && c <= 0x39) /* [0-9] */
|| (c >= 0x41 && c <= 0x46) /* [A-Z] */
|| (c >= 0x61 && c <= 0x66); /* [a-z] */
}