55 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			55 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* Common functions and includes for our test programs. */
 | |
| 
 | |
| #include <stdio.h>
 | |
| #include <stdlib.h>
 | |
| #include <ctype.h>
 | |
| #include <string.h>
 | |
| #include <stdarg.h>
 | |
| 
 | |
| #include "../utf8proc.h"
 | |
| 
 | |
| size_t lineno = 0;
 | |
| 
 | |
| void check(int cond, const char *format, ...)
 | |
| {
 | |
|      if (!cond) {
 | |
|           va_list args;
 | |
|           fprintf(stderr, "line %zd: ", lineno);
 | |
|           va_start(args, format);
 | |
|           vfprintf(stderr, format, args);
 | |
|           va_end(args);
 | |
|           fprintf(stderr, "\n");
 | |
|           exit(1);
 | |
|      }
 | |
| }
 | |
| 
 | |
| size_t skipspaces(const char *buf, size_t i)
 | |
| {
 | |
|     while (isspace(buf[i])) ++i;
 | |
|     return i;
 | |
| }
 | |
| 
 | |
| /* if buf points to a sequence of codepoints encoded as hexadecimal strings,
 | |
|    separated by whitespace, and terminated by any character not in
 | |
|    [0-9a-fA-F] or whitespace, then stores the corresponding utf8 string
 | |
|    in dest, returning the number of bytes read from buf */
 | |
| utf8proc_ssize_t unsafe_encode_char(utf8proc_int32_t uc, utf8proc_uint8_t *dst);
 | |
| size_t encode(char *dest, const char *buf)
 | |
| {
 | |
|      size_t i = 0, j, d = 0;
 | |
|      for (;;) {
 | |
|           int c;
 | |
|           i = skipspaces(buf, i);
 | |
|           for (j=i; buf[j] && strchr("0123456789abcdef", tolower(buf[j])); ++j)
 | |
|                ; /* find end of hex input */
 | |
|           if (j == i) { /* no codepoint found */
 | |
|                dest[d] = 0; /* NUL-terminate destination string */
 | |
|                return i + 1;
 | |
|           }
 | |
|           check(sscanf(buf + i, "%x", (unsigned int *)&c) == 1, "invalid hex input %s", buf+i);
 | |
|           i = j; /* skip to char after hex input */
 | |
|           d += unsafe_encode_char(c, (utf8proc_uint8_t *) (dest + d));
 | |
|      }
 | |
| }
 | |
| 
 |