aboutsummaryrefslogblamecommitdiff
path: root/utils/chargen.c
blob: d6fa86a20bd2ac3334e6af68c2f0ec203f48d9e3 (plain) (tree)































































































































                                                                                                                    
/* Copyright (c) 2013, Vsevolod Stakhov
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *       * Redistributions of source code must retain the above copyright
 *         notice, this list of conditions and the following disclaimer.
 *       * Redistributions in binary form must reproduce the above copyright
 *         notice, this list of conditions and the following disclaimer in the
 *         documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED ''AS IS'' AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL AUTHOR BE LIABLE FOR ANY
 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/**
 * @file
 * This utility generates the character table for ucl.
 */

#include <stdio.h>
#include <ctype.h>
#include <stdbool.h>

/**
 * Write a flag name into a buffer, prefixed with "|" when a previous flag
 * has already been written for the current entry.
 *
 * @param flag    flag name to write
 * @param need_or in: whether a "|" separator must precede the flag;
 *                out: always set to true
 * @param val     destination buffer; written with sprintf, so the caller
 *                must guarantee it is large enough
 * @return value returned by sprintf (characters written, excluding the
 *         terminating NUL)
 */
static inline int
print_flag (const char *flag, bool *need_or, char *val)
{
	const char *separator = "";

	if (*need_or) {
		separator = "|";
	}
	/* Any flag written after this one has to be OR-ed with it */
	*need_or = true;

	return sprintf (val, "%s%s", separator, flag);
}

/**
 * Print to stdout a C definition of a `static const unsigned int` array
 * that holds, for each byte value, the OR-ed set of UCL_CHARACTER_* flags
 * describing that character.
 *
 * @param argc argument count
 * @param argv optional argv[1] overrides the generated array name
 *             (default "ucl_chartable")
 * @return always 0
 */
int
main (int argc, char **argv)
{
	/*
	 * One entry per possible byte value (0..255). A 255-entry table would
	 * leave byte 0xFF without an entry.
	 */
	enum { CHARTABLE_SIZE = 256 };
	int i, col, r;
	const char *name = "ucl_chartable";
	bool need_or;
	char valbuf[2048];

	col = 0;

	if (argc > 1) {
		name = argv[1];
	}

	printf ("static const unsigned int %s[%d] = {\n", name, CHARTABLE_SIZE);

	for (i = 0; i < CHARTABLE_SIZE; i ++) {
		/* Each entry is assembled in valbuf from scratch */
		need_or = false;
		r = 0;

		if (i == ' ' || i == '\t') {
			r += print_flag ("UCL_CHARACTER_WHITESPACE", &need_or, valbuf + r);
		}
		if (isspace (i)) {
			r += print_flag ("UCL_CHARACTER_WHITESPACE_UNSAFE", &need_or, valbuf + r);
		}
		if (isalnum (i) || i >= 0x80 || i == '/' || i == '_') {
			r += print_flag ("UCL_CHARACTER_KEY_START", &need_or, valbuf + r);
		}
		if (isalnum (i) || i == '-' || i == '_' || i == '/' || i == '.' || i >= 0x80) {
			r += print_flag ("UCL_CHARACTER_KEY", &need_or, valbuf + r);
		}
		if (i == 0 || i == '\r' || i == '\n' || i == ']' || i == '}' || i == ';' || i == ',' || i == '#') {
			r += print_flag ("UCL_CHARACTER_VALUE_END", &need_or, valbuf + r);
		}
		else {
			/* The value flags are emitted only for non-terminator characters */
			if (isprint (i) || i >= 0x80) {
				r += print_flag ("UCL_CHARACTER_VALUE_STR", &need_or, valbuf + r);
			}
			if (isdigit (i) || i == '-') {
				r += print_flag ("UCL_CHARACTER_VALUE_DIGIT_START", &need_or, valbuf + r);
			}
			if (isalnum (i) || i == '.' || i == '-' || i == '+') {
				r += print_flag ("UCL_CHARACTER_VALUE_DIGIT", &need_or, valbuf + r);
			}
		}
		if (i == '"' || i == '\\' || i == '/' || i == 'b' ||
			i == 'f' || i == 'n' || i == 'r' || i == 't' || i == 'u') {
			r += print_flag ("UCL_CHARACTER_ESCAPE", &need_or, valbuf + r);
		}
		if (i == ' ' || i == '\t' || i == ':' || i == '=') {
			r += print_flag ("UCL_CHARACTER_KEY_SEP", &need_or, valbuf + r);
		}
		if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
				i == '"' || i == '\f') {
			r += print_flag ("UCL_CHARACTER_JSON_UNSAFE", &need_or, valbuf + r);
		}
		if (i == '\n' || i == '\r' || i == '\\' || i == '\b' || i == '\t' ||
				i == '"' || i == '\f' || i == '=' || i == ':' || i == '{' || i == '[' || i == ' ') {
			r += print_flag ("UCL_CHARACTER_UCL_UNSAFE", &need_or, valbuf + r);
		}

		/* No flag matched at all: mark the character as denied */
		if (!need_or) {
			r += print_flag ("UCL_CHARACTER_DENIED", &need_or, valbuf + r);
		}

		/* Annotate printable characters with a comment showing the character */
		if (isprint (i)) {
			r += sprintf (valbuf + r, " /* %c */", i);
		}
		/* Every entry but the last one is followed by a separator */
		if (i != CHARTABLE_SIZE - 1) {
			r += sprintf (valbuf + r, ", ");
		}

		/* Start a new output line once the current one exceeds 80 columns */
		col += r;
		if (col > 80) {
			printf ("\n%s", valbuf);
			col = r;
		}
		else {
			printf ("%s", valbuf);
		}
	}
	/* The array definition is a declaration and must end with ';' */
	printf ("\n};\n");

	return 0;
}