/* Branch : */
/*
* Copyright © 2012 Ran Benita <ran234@gmail.com>
* SPDX-License-Identifier: MIT
*/
#include "config.h"
#include <assert.h>
#include <stdint.h>
#include "scanner-utils.h"
#include "xkbcomp-priv.h"
#include "parser-priv.h"
/*
 * Character that separates the integer part from the fractional part of a
 * float literal. It is a fixed period, so number lexing does not depend on
 * the current locale.
 *
 * NOTE(review): this has external linkage (no `static`); confirm whether any
 * other translation unit references it before narrowing its scope.
 */
const char DECIMAL_SEPARATOR = '.';
/*
 * Try to lex a number literal (hexadecimal, decimal or float) at the current
 * scanner position.
 *
 * @param s        Scanner to read from.
 * @param out      Receives the parsed integer value. For a float literal this
 *                 is the integer part only: the fraction is checked for
 *                 syntax and then discarded.
 * @param out_tok  Receives INTEGER, FLOAT or ERROR_TOK when true is returned.
 *
 * @return false when the digit parser reports 0 (presumably: no digits at
 *         this position), in which case *out_tok is left untouched; true
 *         otherwise. Note that a "0x" prefix stays consumed even when false
 *         is returned.
 */
static bool
number(struct scanner *s, int64_t *out, int *out_tok)
{
    const bool is_hex = scanner_lit(s, "0x");
    const int count = is_hex ? scanner_hex_int64(s, out)
                             : scanner_dec_int64(s, out);

    /* Not a number at all: let the caller report it. */
    if (count == 0)
        return false;

    /* The digit parser flagged the literal as malformed. */
    if (count == -1) {
        *out_tok = ERROR_TOK;
        return true;
    }

    /* Hexadecimal literals never carry a fractional part. */
    if (is_hex || !scanner_chr(s, DECIMAL_SEPARATOR)) {
        *out_tok = INTEGER;
        return true;
    }

    /*
     * The parser does not use floats, so the actual floating-point value is
     * irrelevant: we only need to make sure the syntax is correct, and then
     * truncate to the integer part already stored in *out.
     *
     * `strtold` is deliberately avoided: it depends on the locale (e.g. for
     * the decimal separator, which may be a period or a comma) and requires
     * a null-terminated string, which we cannot guarantee here.
     */
    int64_t fraction;
    if (scanner_dec_int64(s, &fraction) < 0) {
        *out_tok = ERROR_TOK;
        return true;
    }

    *out_tok = FLOAT;
    return true;
}
int
_xkbcommon_lex(YYSTYPE *yylval, struct scanner *s)
{
skip_more_whitespace_and_comments:
/* Skip spaces. */
while (is_space(scanner_peek(s))) scanner_next(s);
/* Skip comments. */
if (scanner_lit(s, "//") || scanner_chr(s, '#')) {
scanner_skip_to_eol(s);
goto skip_more_whitespace_and_comments;
}
/* See if we're done. */
if (scanner_eof(s)) return END_OF_FILE;
/* New token. */
s->token_pos = s->pos;
s->buf_pos = 0;
/* String literal. */
if (scanner_chr(s, '\"')) {
while (!scanner_eof(s) && !scanner_eol(s) && scanner_peek(s) != '\"') {
if (scanner_chr(s, '\\')) {
uint8_t o;
const size_t start_pos = s->pos;
if (scanner_chr(s, '\\')) scanner_buf_append(s, '\\');
else if (scanner_chr(s, '"')) scanner_buf_append(s, '"');
else if (scanner_chr(s, 'n')) scanner_buf_append(s, '\n');
else if (scanner_chr(s, 't')) scanner_buf_append(s, '\t');
else if (scanner_chr(s, 'r')) scanner_buf_append(s, '\r');
else if (scanner_chr(s, 'b')) scanner_buf_append(s, '\b');
else if (scanner_chr(s, 'f')) scanner_buf_append(s, '\f');
else if (scanner_chr(s, 'v')) scanner_buf_append(s, '\v');
else if (scanner_chr(s, 'e')) scanner_buf_append(s, '\x1b');
else if (scanner_chr(s, 'u')) {
/* Unicode escape sequence */
uint32_t cp = 0;
if (scanner_chr(s, '{') &&
scanner_unicode_code_point(s, &cp) &&
/* NOTE: the order of the check is important! */
scanner_chr(s, '}') && is_valid_char(cp)) {
/* Encode code point using UTF-8 */
scanner_buf_appends_code_point(s, cp);
} else {
scanner_warn(
s, XKB_WARNING_INVALID_UNICODE_ESCAPE_SEQUENCE,
"invalid Unicode escape sequence (%.*s) "
"in string literal",
(int) (s->pos - start_pos + 1),
&s->s[start_pos - 1]
);
/* Ignore. */
}
}
else if (scanner_oct(s, &o) && is_valid_char((uint32_t) o))
scanner_buf_append(s, (char) o);
else if (s->pos > start_pos) {
scanner_warn(s, XKB_WARNING_INVALID_ESCAPE_SEQUENCE,
"invalid octal escape sequence (%.*s) "
"in string literal",
(int) (s->pos - start_pos + 1),
&s->s[start_pos - 1]);
/* Ignore. */
}
else {
scanner_warn(s, XKB_WARNING_UNKNOWN_CHAR_ESCAPE_SEQUENCE,
"unknown escape sequence (\\%c) in string literal",
scanner_peek(s));
/* Ignore. */
}
} else {
scanner_buf_append(s, scanner_next(s));
}
}
if (!scanner_buf_append(s, '\0') || !scanner_chr(s, '\"')) {
scanner_err(s, XKB_LOG_MESSAGE_NO_ID,
"unterminated string literal");
return ERROR_TOK;
}
yylval->str = strdup(s->buf);
if (!yylval->str)
return ERROR_TOK;
return STRING;
}
/* Key name literal. */
if (scanner_chr(s, '<')) {
while (is_graph(scanner_peek(s)) && scanner_peek(s) != '>')
scanner_next(s);
if (!scanner_chr(s, '>')) {
scanner_err(s, XKB_LOG_MESSAGE_NO_ID,
"unterminated key name literal");
return ERROR_TOK;
}
/* Empty key name literals are allowed. */
const char *start = s->s + s->token_pos + 1;
const size_t len = s->pos - s->token_pos - 2;
yylval->atom = xkb_atom_intern(s->ctx, start, len);
return KEYNAME;
}
/* Operators and punctuation. */
if (scanner_chr(s, ';')) return SEMI;
if (scanner_chr(s, '{')) return OBRACE;
if (scanner_chr(s, '}')) return CBRACE;
if (scanner_chr(s, '=')) return EQUALS;
if (scanner_chr(s, '[')) return OBRACKET;
if (scanner_chr(s, ']')) return CBRACKET;
if (scanner_chr(s, '(')) return OPAREN;
if (scanner_chr(s, ')')) return CPAREN;
if (scanner_chr(s, '.')) return DOT;
if (scanner_chr(s, ',')) return COMMA;
if (scanner_chr(s, '+')) return PLUS;
if (scanner_chr(s, '-')) return MINUS;
if (scanner_chr(s, '*')) return TIMES;
if (scanner_chr(s, '/')) return DIVIDE;
if (scanner_chr(s, '!')) return EXCLAM;
if (scanner_chr(s, '~')) return INVERT;
int tok = ERROR_TOK;
/* Identifier. */
if (is_alpha(scanner_peek(s)) || scanner_peek(s) == '_') {
while (is_alnum(scanner_peek(s)) || scanner_peek(s) == '_')
scanner_next(s);
const char *start = s->s + s->token_pos;
const size_t len = s->pos - s->token_pos;
/* Keyword. */
tok = keyword_to_token(start, len);
if (tok >= 0) return tok;
yylval->sval = SVAL(start, len);
return IDENT;
}
/* Number literal (hexadecimal / decimal / float). */
if (number(s, &yylval->num, &tok)) {
if (tok == ERROR_TOK) {
scanner_err(s, XKB_ERROR_MALFORMED_NUMBER_LITERAL,
"malformed number literal");
return ERROR_TOK;
}
return tok;
}
scanner_err(s, XKB_LOG_MESSAGE_NO_ID,
"unrecognized token");
return ERROR_TOK;
}
/*
 * Parse XKB text held in a memory buffer.
 *
 * @param ctx        Context handed to the scanner and to the parser.
 * @param string     Start of the text to parse.
 * @param len        Length of the text, as passed to scanner_init().
 * @param file_name  Name handed to the scanner along with the text.
 * @param map        Forwarded unchanged to parse().
 *
 * @return The result of parse(), or NULL when the text does not appear to be
 *         in a supported character encoding.
 */
XkbFile *
XkbParseString(struct xkb_context *ctx, const char *string, size_t len,
               const char *file_name, const char *map)
{
    struct scanner scanner;
    scanner_init(&scanner, ctx, string, len, file_name, NULL);

    /*
     * Basic detection of wrong character encoding: the first character
     * relevant to the grammar must be ASCII (whitespace, section, comment).
     */
    if (scanner_check_supported_char_encoding(&scanner))
        return parse(ctx, &scanner, map);

    scanner_err(&scanner, XKB_ERROR_INVALID_FILE_ENCODING,
                "This could be a file encoding issue. "
                "Supported encodings must be backward compatible with ASCII.");
    scanner_err(&scanner, XKB_ERROR_INVALID_FILE_ENCODING,
                "E.g. ISO/CEI 8859 and UTF-8 are supported "
                "but UTF-16, UTF-32 and CP1026 are not.");
    return NULL;
}
/*
 * Parse an XKB file from an open stdio stream.
 *
 * The contents are obtained with map_file(), parsed with XkbParseString()
 * and released with unmap_file() before returning.
 *
 * @param ctx        Context used for logging and parsing.
 * @param file       Stream to read the file contents from.
 * @param file_name  Name used in diagnostics.
 * @param map        Forwarded unchanged to XkbParseString().
 *
 * @return The result of XkbParseString(), or NULL when the file contents
 *         could not be obtained.
 */
XkbFile *
XkbParseFile(struct xkb_context *ctx, FILE *file,
             const char *file_name, const char *map)
{
    char *string;
    size_t size;

    if (!map_file(file, &string, &size)) {
        log_err(ctx, XKB_LOG_MESSAGE_NO_ID,
                "Couldn't read XKB file %s: %s\n",
                file_name, strerror(errno));
        return NULL;
    }

    /* The parse result must not depend on the buffer: it is released next. */
    XkbFile * const xkb_file =
        XkbParseString(ctx, string, size, file_name, map);
    unmap_file(string, size);

    return xkb_file;
}