55 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			55 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
|   | /* Common functions and includes for our test programs. */ | ||
|  | 
 | ||
|  | #include <stdio.h>
 | ||
|  | #include <stdlib.h>
 | ||
|  | #include <ctype.h>
 | ||
|  | #include <string.h>
 | ||
|  | #include <stdarg.h>
 | ||
|  | 
 | ||
|  | #include "../utf8proc.h"
 | ||
|  | 
 | ||
|  | size_t lineno = 0; | ||
|  | 
 | ||
|  | void check(int cond, const char *format, ...) | ||
|  | { | ||
|  |      if (!cond) { | ||
|  |           va_list args; | ||
|  |           fprintf(stderr, "line %zd: ", lineno); | ||
|  |           va_start(args, format); | ||
|  |           vfprintf(stderr, format, args); | ||
|  |           va_end(args); | ||
|  |           fprintf(stderr, "\n"); | ||
|  |           exit(1); | ||
|  |      } | ||
|  | } | ||
|  | 
 | ||
|  | size_t skipspaces(const char *buf, size_t i) | ||
|  | { | ||
|  |     while (isspace(buf[i])) ++i; | ||
|  |     return i; | ||
|  | } | ||
|  | 
 | ||
|  | /* if buf points to a sequence of codepoints encoded as hexadecimal strings,
 | ||
|  |    separated by whitespace, and terminated by any character not in | ||
|  |    [0-9a-fA-F] or whitespace, then stores the corresponding utf8 string | ||
|  |    in dest, returning the number of bytes read from buf */ | ||
|  | utf8proc_ssize_t unsafe_encode_char(utf8proc_int32_t uc, utf8proc_uint8_t *dst); | ||
|  | size_t encode(char *dest, const char *buf) | ||
|  | { | ||
|  |      size_t i = 0, j, d = 0; | ||
|  |      for (;;) { | ||
|  |           int c; | ||
|  |           i = skipspaces(buf, i); | ||
|  |           for (j=i; buf[j] && strchr("0123456789abcdef", tolower(buf[j])); ++j) | ||
|  |                ; /* find end of hex input */ | ||
|  |           if (j == i) { /* no codepoint found */ | ||
|  |                dest[d] = 0; /* NUL-terminate destination string */ | ||
|  |                return i + 1; | ||
|  |           } | ||
|  |           check(sscanf(buf + i, "%x", (unsigned int *)&c) == 1, "invalid hex input %s", buf+i); | ||
|  |           i = j; /* skip to char after hex input */ | ||
|  |           d += unsafe_encode_char(c, (utf8proc_uint8_t *) (dest + d)); | ||
|  |      } | ||
|  | } | ||
|  | 
 |