/* Test of line breaking of UTF-8 strings.
- Copyright (C) 2008 Free Software Foundation, Inc.
+ Copyright (C) 2008-2013 Free Software Foundation, Inc.
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
#include "unilbrk.h"
-#include <stdio.h>
#include <stdlib.h>
-#define SIZEOF(array) (sizeof (array) / sizeof (array[0]))
-#define ASSERT(expr) \
- do \
- { \
- if (!(expr)) \
- { \
- fprintf (stderr, "%s:%d: assertion failed\n", __FILE__, __LINE__); \
- fflush (stderr); \
- abort (); \
- } \
- } \
- while (0)
+#include "macros.h"
int
main ()
u8_possible_linebreaks (input, SIZEOF (input), "GB18030", p);
for (i = 0; i < 91; i++)
- {
- ASSERT (p[i] == (i == 90 ? UC_BREAK_MANDATORY :
- i == 7
- || i == 13 || i == 39
- || i == 41 || i == 43 || i == 44 || i == 50
- || i == 55 || i == 61 || i == 67
- || i == 70 || i == 73 || i == 77 || i == 80
- || i == 84 || i == 87 ? UC_BREAK_POSSIBLE :
- UC_BREAK_PROHIBITED));
- }
+ {
+ ASSERT (p[i] == (i == 90 ? UC_BREAK_MANDATORY :
+ i == 7
+ || i == 13 || i == 39
+ || i == 43 || i == 44
+ || i == 61 || i == 67
+ || i == 70 || i == 73 || i == 77 || i == 80
+ || i == 84 || i == 87 ? UC_BREAK_POSSIBLE :
+ UC_BREAK_PROHIBITED));
+ }
free (p);
}
u8_possible_linebreaks (input, SIZEOF (input), "GB2312", p);
for (i = 0; i < 91; i++)
- {
- ASSERT (p[i] == (i == 90 ? UC_BREAK_MANDATORY :
- i == 2 || i == 4 || i == 7
- || (i >= 13 && i <= 35 && (i % 2) != 0) || i == 39
- || i == 41 || i == 43 || i == 44 || i == 50
- || i == 52 || i == 55 || i == 61 || i == 67
- || i == 70 || i == 73 || i == 77 || i == 80
- || i == 84 || i == 87 ? UC_BREAK_POSSIBLE :
- UC_BREAK_PROHIBITED));
- }
+ {
+ ASSERT (p[i] == (i == 90 ? UC_BREAK_MANDATORY :
+ i == 7
+ || i == 13 || i == 39
+ || i == 43 || i == 44
+ || i == 52 || i == 61 || i == 67
+ || i == 70 || i == 73 || i == 77 || i == 80
+ || i == 84 || i == 87 ? UC_BREAK_POSSIBLE :
+ UC_BREAK_PROHIBITED));
+ }
free (p);
}
}
+ /* Test that a break is possible after a zero-width space followed by some
+ regular spaces (rule LB8 in Unicode TR#14 revision 26). */
+ {
+ static const uint8_t input[6] = "x\342\200\213 y";
+ char *p = (char *) malloc (SIZEOF (input));
+ size_t i;
+
+ u8_possible_linebreaks (input, SIZEOF (input), "UTF-8", p);
+ for (i = 0; i < 4; i++)
+ {
+ ASSERT (p[i] == (i == 5 ? UC_BREAK_POSSIBLE : UC_BREAK_PROHIBITED));
+ }
+ free (p);
+ }
+
return 0;
}