creole/test_creole.c

207 lines
4.4 KiB
C
Raw Normal View History

2023-02-05 06:44:37 -05:00
#include "greatest.h"
GREATEST_MAIN_DEFS();
#include "creole.c"
/**************************************************************************
2023-02-06 23:38:39 -05:00
* Reader
2023-02-05 06:44:37 -05:00
*************************************************************************/
#define reader_lit(r, s) do { \
r.p = (unsigned char *)s; \
r.left = sizeof(s) - 1; \
} while(0)
TEST reader_test_basic(struct creole_reader *r) {
size_t i = 0;
unsigned char *s = r->p;
size_t len = r->left;
for (i = 0; i < len; i++) {
ASSERT_EQ(read_eof(r), 0);
ASSERT_EQ(read(r), s[i]);
}
for (i = 0; i < 5; i++) {
ASSERT_EQ(read_eof(r), 1);
ASSERT_EQ(read(r), -1);
}
PASS();
}
SUITE(reader) {
struct creole_reader r = {0};
reader_lit(r, "abcdefg");
RUN_TEST1(reader_test_basic, &r);
reader_lit(r, "");
RUN_TEST1(reader_test_basic, &r);
}
2023-02-06 23:38:39 -05:00
/**************************************************************************
* Pseudo UTF-8 sequences
*************************************************************************/
TEST no_values(void) {
struct creole_reader r;
struct word w;
r.p = NULL;
r.left = 0;
ASSERT_EQ(decode_seq(&r, &w), 0);
PASS();
}
struct seq {
creole_word max;
unsigned encode_to;
unsigned high_bits;
unsigned char minbuf[7];
unsigned char maxbuf[7];
};
void bprint(unsigned char c) {
int i;
for (i = 0; i < 8; i++) {
printf("%u", (c >> (7 - i)) & 1);
}
}
void bprintb(unsigned char *b, int len) {
while (len-- > 0) {
bprint(*b++);
printf(" ");
}
}
TEST encode_byte_seq(struct seq *s) {
creole_word i = 0;
int j;
unsigned char buf[7];
for (;;) {
printf("0x%X ", i);
bprintb(s->minbuf, s->encode_to);
printf("\n");
ASSERT_EQ(creole_encode(i, s->encode_to, s->high_bits,
buf), 1);
ASSERT_MEM_EQ(s->minbuf, buf, s->encode_to);
if (i == s->max)
break;
i++;
for (j = s->encode_to - 1; j > 0; j--) {
if (s->minbuf[j] == 0xBF) {
s->minbuf[j] = 0x80;
} else {
s->minbuf[j]++;
break;
}
}
if (j == 0)
s->minbuf[0]++;
}
ASSERT_MEM_EQ(s->maxbuf, s->minbuf, s->encode_to);
PASS();
}
TEST encode_decode_byte_seq(struct seq *s) {
unsigned char buf[7];
struct creole_reader r = {0};
struct word w;
creole_word i = 0;
for (;;) {
ASSERT_EQ(creole_encode(i, s->encode_to, s->high_bits,
buf), 1);
r.p = buf;
r.left = s->encode_to;
ASSERT_EQ(decode_seq(&r, &w), 1);
ASSERT_EQ(w.len, s->encode_to);
ASSERT_EQ(w.high_bits, s->high_bits);
ASSERT_EQ(w.word, i);
if (i == s->max)
break;
i++;
}
PASS();
}
SUITE(pseudo_utf8_encode_all) {
struct seq s;
RUN_TEST(no_values);
s.max = 0x7F;
s.encode_to = 1;
s.high_bits = 0;
s.minbuf[0] = 0x00;
s.maxbuf[0] = 0x7F;
RUN_TEST1(encode_byte_seq, &s);
for (s.high_bits = 0; s.high_bits < 16; s.high_bits++) {
memset(s.maxbuf, 0xBF, sizeof(s.maxbuf));
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0x7F;
s.encode_to = 2;
s.maxbuf[0] = s.minbuf[0] = 0xC0 | (s.high_bits << 1);
s.maxbuf[0] = 0xC1 | (s.high_bits << 1);
s.minbuf[1] = 0x80;
RUN_TEST1(encode_byte_seq, &s);
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0xFFF;
s.encode_to = 3;
s.minbuf[0] = 0xE0 | s.high_bits;
s.maxbuf[0] = 0xE0 | s.high_bits;
s.minbuf[1] = 0x80;
RUN_TEST1(encode_byte_seq, &s);
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0x1FFFF;
s.encode_to = 4;
s.maxbuf[0] = s.minbuf[0] = 0xF0 | (s.high_bits >> 1);
2023-02-06 23:50:50 -05:00
s.minbuf[1] = 0x80 | ((s.high_bits & 0x1) << 5);
s.maxbuf[1] = 0x9F | ((s.high_bits & 0x1) << 5);
2023-02-06 23:38:39 -05:00
RUN_TEST1(encode_byte_seq, &s);
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0x3FFFFF;
s.encode_to = 5;
s.maxbuf[0] = s.minbuf[0] = 0xF8 | (s.high_bits >> 2);
2023-02-06 23:50:50 -05:00
s.minbuf[1] = 0x80 | ((s.high_bits & 0x3) << 4);
s.maxbuf[1] = 0x8F | ((s.high_bits & 0x3) << 4);
2023-02-06 23:38:39 -05:00
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0x7FFFFFF;
s.encode_to = 6;
s.maxbuf[0] = s.minbuf[0] = 0xFC | (s.high_bits >> 3);
2023-02-06 23:50:50 -05:00
s.minbuf[1] = 0x80 | ((s.high_bits & 0x7) << 3);
s.maxbuf[1] = 0x87 | ((s.high_bits & 0x7) << 3);
2023-02-06 23:38:39 -05:00
RUN_TEST1(encode_byte_seq, &s);
2023-02-06 23:50:50 -05:00
memset(s.minbuf, 0x80, sizeof(s.minbuf));
2023-02-06 23:38:39 -05:00
s.max = 0xFFFFFFFF;
s.encode_to = 7;
s.maxbuf[0] = s.minbuf[0] = 0xFE;
s.minbuf[1] = 0x80 | (s.high_bits << 2);
s.maxbuf[1] = 0x83 | (s.high_bits << 2);
RUN_TEST1(encode_byte_seq, &s);
}
}
2023-02-05 06:44:37 -05:00
int main(int argc, char *argv[]) {
GREATEST_MAIN_BEGIN();
RUN_SUITE(reader);
2023-02-06 23:38:39 -05:00
RUN_SUITE(pseudo_utf8_encode_all);
2023-02-05 06:44:37 -05:00
GREATEST_MAIN_END();
}