/*
Copyright (C) 2016 Alexander Borisov
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Author: lex.borisov@gmail.com (Alexander Borisov)
*/
#include "mycss/tokenizer.h"
#include "mycss/tokenizer_resource.h"
#include "myhtml/utils/resources.h"
mycss_status_t mycss_tokenizer_chunk(mycss_entry_t* entry, const char* css, size_t css_length)
{
entry->current_buffer = myhtml_incomming_buffer_add(entry->current_buffer, entry->mcobject_incoming_buffer,
css, css_length);
if(entry->current_buffer == NULL)
return MyCSS_STATUS_ERROR_TOKENIZER_INCOMING_BUFFER_ADD;
// first init
if(entry->first_buffer == NULL)
entry->first_buffer = entry->current_buffer;
if(entry->token == NULL) {
entry->token = (mycss_token_t*)myhtml_calloc(1, sizeof(mycss_token_t));
if(entry->token == NULL)
return MyCSS_STATUS_ERROR_TOKENIZER_TOKEN_ALLOCATION;
}
return mycss_tokenizer_process(entry, css, css_length);
}
mycss_status_t mycss_tokenizer_process(mycss_entry_t* entry, const char* css, size_t css_length)
{
/*
Why use utf-8 when the declaration says utf-16?
The bytes of the encoding declaration spell out “@charset "…";” in ASCII,
but UTF-16 is not ASCII-compatible. Either you’ve typed in complete gibberish (like 䁣桡牳整•utf-16be∻)
to get the right bytes in the document, which we don’t want to encourage,
or your document is actually in an ASCII-compatible encoding and your encoding declaration is lying.
Either way, defaulting to UTF-8 is a decent answer.
As well, this mimics the behavior of HTML’s attribute.
*/
if(entry->encoding == MyHTML_ENCODING_UTF_16LE || entry->encoding == MyHTML_ENCODING_UTF_16BE)
entry->encoding = MyHTML_ENCODING_UTF_8;
mycss_t* mycss = entry->mycss;
mycss_tokenizer_state_f* state_f = mycss->parse_state_func;
myhtml_incoming_buffer_t *current = entry->current_buffer;
do {
myhtml_incoming_buffer_t *mt = entry->current_buffer;
mt->length = 0;
while (mt->length < mt->size) {
mt->length = state_f[entry->state](entry, entry->token, mt->data, mt->length, mt->size);
}
entry->current_buffer = mt->next;
}
while(entry->current_buffer);
entry->current_buffer = current;
return MyCSS_STATUS_OK;
}
mycss_status_t mycss_tokenizer_end(mycss_entry_t* entry)
{
mycss_t* mycss = entry->mycss;
mycss_tokenizer_state_f* state_f = mycss->parse_state_func;
if(entry->state != MyCSS_TOKENIZER_STATE_DATA)
{
myhtml_incoming_buffer_t *mt = entry->current_buffer;
size_t end_state = (MyCSS_TOKENIZER_STATE_LAST_ENTRY + entry->state);
mt->length = state_f[end_state](entry, entry->token, mt->data, mt->length, mt->size);
}
entry->type |= MyCSS_ENTRY_TYPE_END;
return MyCSS_STATUS_OK;
}
size_t mycss_tokenizer_run_state_single(mycss_entry_t* entry, mycss_tokenizer_state_t state, const char* css, size_t css_offset, size_t css_size)
{
mycss_t* mycss = entry->mycss;
mycss_tokenizer_state_f* state_f = mycss->parse_state_func;
return state_f[state](entry, entry->token, css, css_offset, css_size);
}
size_t mycss_tokenizer_state_set_current_buffer_for_continue(mycss_entry_t* entry, size_t css_offset, size_t css_minus_offset)
{
if(css_minus_offset == 0)
return css_offset;
if(css_offset >= css_minus_offset)
return css_offset;
myhtml_incoming_buffer_t *buffer = entry->current_buffer;
size_t need = (css_minus_offset - css_offset);
size_t position = buffer->offset - need;
while(buffer && buffer->offset > position)
buffer = buffer->prev;
entry->current_buffer = buffer;
return (position - buffer->offset);
}
size_t mycss_tokenizer_token_strcasecmp(mycss_entry_t* entry, mycss_token_t* token, const char* to, size_t to_length)
{
myhtml_incoming_buffer_t *buffer = myhtml_incoming_buffer_find_by_position(entry->current_buffer, token->begin);
size_t token_offset = token->begin - buffer->offset;
return myhtml_incoming_buffer_escaped_case_cmp(&buffer, to, to_length, &token_offset);
}
//////////////////////
// Begin All State
//
size_t mycss_tokenizer_state_data(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->begin = entry->current_buffer->offset + css_offset;
token->data = &css[css_offset];
entry->state = mycss_begin_chars_state_map[ (const unsigned char)css[css_offset] ];
css_offset++;
return css_offset;
}
/////////////////////////////////////////////////////////
//// whitespace
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_whitespace(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
const unsigned char *u_css = (const unsigned char*)css;
while(css_offset < css_size)
{
if(mycss_begin_chars_state_map[ u_css[css_offset] ] != MyCSS_TOKENIZER_STATE_WHITESPACE)
{
token->length = (entry->current_buffer->offset + css_offset) - token->begin;
token->type = MyCSS_TOKEN_TYPE_WHITESPACE;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
break;
}
css_offset++;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0022 QUOTATION MARK (")
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_quotation_mark(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
// skip QUOTATION MARK (")
token->begin += 1;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED;
entry->state_back = MyCSS_TOKENIZER_STATE_QUOTATION_MARK_BACK;
return css_offset;
}
size_t mycss_tokenizer_state_quotation_mark_back(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0023 NUMBER SIGN (#)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_number_sign(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
const unsigned char *u_css = (const unsigned char*)css;
if(mycss_chars_name_code_point_map[ u_css[css_offset] ] != 0xff)
{
token->begin++;
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_BACK;
}
else if(css[css_offset] == '\\') {
css_offset++;
if(css_offset >= css_size) {
entry->state = MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_RSOLIDUS;
return css_offset;
}
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
css_offset--;
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
else {
token->begin++;
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_BACK;
}
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_number_sign_name_back(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->type = MyCSS_TOKEN_TYPE_HASH;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
size_t mycss_tokenizer_state_number_sign_name_rsolidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_BACK;
token->begin++;
css_offset++;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0024 DOLLAR SIGN ($)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_dollar_sign(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '=') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_SUFFIX_MATCH;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
}
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0027 APOSTROPHE (')
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_apostrophe(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
// skip APOSTROPHE (')
token->begin += 1;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED;
entry->state_back = MyCSS_TOKENIZER_STATE_QUOTATION_MARK_BACK;
return css_offset;
}
size_t mycss_tokenizer_state_apostrophe_back(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0028 LEFT PARENTHESIS (()
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_left_parenthesis(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_LEFT_PARENTHESIS;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0029 RIGHT PARENTHESIS ())
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_right_parenthesis(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_RIGHT_PARENTHESIS;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002A ASTERISK (*)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_asterisk(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '=') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_SUBSTRING_MATCH;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
}
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002B PLUS SIGN (+)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_plus_sign(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] >= '0' && css[css_offset] <= '9') {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DIGIT;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
}
else if(css[css_offset] == '.') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_PLUS_SIGN_FULL_STOP;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_plus_sign_full_stop(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] >= '0' && css[css_offset] <= '9') {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DECIMAL;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002C COMMA (,)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_comma(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_COMMA;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002D HYPHEN-MINUS (-)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_hyphen_minus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
const unsigned char *u_css = (const unsigned char*)css;
// If the input stream starts with a number, reconsume the current input code point,
// consume a numeric token, and return it.
if(css[css_offset] >= '0' && css[css_offset] <= '9') {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DIGIT;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
}
else if(css[css_offset] == '.') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_FULL_STOP;
}
// Otherwise, if the input stream starts with an identifier,
// reconsume the current input code point, consume an ident-like token, and return it.
// and check
// Otherwise, if the next 2 input code points are U+002D HYPHEN-MINUS
// U+003E GREATER-THAN SIGN (->), consume them and return a .
else if(css[css_offset] == '-') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS;
}
// Otherwise, if the input stream starts with an identifier,
// reconsume the current input code point, consume an ident-like token, and return it.
else if(mycss_begin_chars_state_map[ u_css[css_offset] ] == MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT) {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
else if(css[css_offset] == '\\') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_RSOLIDUS;
}
// Otherwise, return a with its value set to the current input code point.
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_hyphen_minus_full_stop(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] >= '0' && css[css_offset] <= '9') {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DECIMAL;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
return css_offset;
}
size_t mycss_tokenizer_state_hyphen_minus_minus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '>') {
css_offset++;
token->length = 3;
token->type = MyCSS_TOKEN_TYPE_CDC;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
else if(mycss_begin_chars_state_map[ ((const unsigned char *)css)[css_offset] ] == MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT) {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
else if(css[css_offset] == '\\') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS_RSOLIDUS;
}
else {
token->length = 1; // only '-'
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
return css_offset;
}
size_t mycss_tokenizer_state_hyphen_minus_minus_rsolidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 2);
}
else {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
return css_offset;
}
size_t mycss_tokenizer_state_hyphen_minus_rsolidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = 1; // only '-'
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
else {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002E FULL STOP (.)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_full_stop(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] >= '0' && css[css_offset] <= '9') {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DECIMAL;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+002F SOLIDUS (/)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_solidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '*') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_SOLIDUS_COMMENT_END;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_solidus_comment_end(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
while(css_offset < css_size)
{
if(css[css_offset] == '/') {
if(css_offset == 0)
{
myhtml_incoming_buffer_t *buffer = entry->current_buffer->prev;
while(buffer && buffer->size == 0)
buffer = buffer->prev;
if(buffer == NULL) {
// panic!, this in not normal, something is very wrong
entry->state = MyCSS_TOKENIZER_STATE_SOLIDUS;
break;
}
if(buffer->data[ (buffer->size - 1) ] == '*') {
css_offset++;
token->length = (entry->current_buffer->offset + css_offset) - token->begin;
token->type = MyCSS_TOKEN_TYPE_COMMENT;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
break;
}
}
else if(css[ (css_offset - 1) ] == '*') {
css_offset++;
token->length = (entry->current_buffer->offset + css_offset) - token->begin;
token->type = MyCSS_TOKEN_TYPE_COMMENT;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
break;
}
}
++css_offset;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+003A COLON (:)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_colon(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_COLON;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+003B SEMICOLON (;)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_semicolon(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_SEMICOLON;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+003C LESS-THAN SIGN (<)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_less_than_sign(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '!') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_less_than_sign_minus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '-') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS_MINUS;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
return css_offset;
}
size_t mycss_tokenizer_state_less_than_sign_minus_minus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '-') {
css_offset++;
token->length = 3;
token->type = MyCSS_TOKEN_TYPE_CDO;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 2);
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0040 COMMERCIAL AT (@)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_commercial_at(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '-') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS;
}
else if(css[css_offset] == '\\') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_RSOLIDUS;
}
else if(mycss_begin_chars_state_map[ ((const unsigned char *)css)[css_offset] ] == MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT) {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
return css_offset;
}
size_t mycss_tokenizer_state_commercial_at_minus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(mycss_begin_chars_state_map[ ((const unsigned char *)css)[css_offset] ] == MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT) {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK;
}
else if(css[css_offset] == '\\') {
css_offset++;
entry->state = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS_RSOLIDUS;
}
else {
token->length = ((entry->current_buffer->offset + css_offset) - token->begin) - 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
return css_offset;
}
size_t mycss_tokenizer_state_commercial_at_minus_rsolidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = ((entry->current_buffer->offset + css_offset) - token->begin) - 2;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 2);
}
else {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK;
}
return css_offset;
}
size_t mycss_tokenizer_state_commercial_at_rsolidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = ((entry->current_buffer->offset + css_offset) - token->begin) - 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
css_offset = mycss_tokenizer_state_set_current_buffer_for_continue(entry, css_offset, 1);
}
else {
css_offset++;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK;
}
return css_offset;
}
size_t mycss_tokenizer_state_commercial_at_back(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->type = MyCSS_TOKEN_TYPE_AT_KEYWORD;
token->begin += 1;
token->length -= 1;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+005B LEFT SQUARE BRACKET ([)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_left_square_bracket(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_LEFT_SQUARE_BRACKET;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+005C REVERSE SOLIDUS (\)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_reverse_solidus(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '\n' || css[css_offset] == '\r' || css[css_offset] == 0x0C) {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
}
else {
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+005D RIGHT SQUARE BRACKET (])
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_right_square_bracket(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_RIGHT_SQUARE_BRACKET;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+005E CIRCUMFLEX ACCENT (^)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_circumflex_accent(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '=') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_PREFIX_MATCH;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
}
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+007B LEFT CURLY BRACKET ({)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_left_curly_bracket(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_LEFT_CURLY_BRACKET;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+007D RIGHT CURLY BRACKET (})
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_right_curly_bracket(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_RIGHT_CURLY_BRACKET;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// Digit
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_digit(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DIGIT;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+0055 LATIN CAPITAL LETTER U (U) || U+0075 LATIN SMALL LETTER U (u)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_letter_u(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '+') {
++css_offset;
if(css_offset >= css_size) {
entry->state = MyCSS_TOKENIZER_STATE_LETTER_U_NEXT;
return css_offset;
}
if(myhtml_string_chars_hex_map[ (const unsigned char)(css[css_offset]) ] != 0xff ||
css[css_offset] == '?')
{
token->begin += 2;
++css_offset;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_BEFORE;
}
else {
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
}
else {
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
return css_offset;
}
size_t mycss_tokenizer_state_letter_u_next(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(myhtml_string_chars_hex_map[ (const unsigned char)(css[css_offset]) ] != 0xff ||
css[css_offset] == '?')
{
token->begin += 2;
++css_offset;
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_BEFORE;
}
else {
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// name-start code point
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_name_start_code_point(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
entry->state = MyCSS_TOKENIZER_GLOBAL_STATE_NAME;
entry->state_back = MyCSS_TOKENIZER_GLOBAL_STATE_IDENT;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+007C VERTICAL LINE (|)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_vertical_line(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '=') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_DASH_MATCH;
}
else if(css[css_offset] == '|') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_COLUMN;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
}
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// U+007E TILDE (~)
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_tilde(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
if(css[css_offset] == '=') {
css_offset++;
token->length = 2;
token->type = MyCSS_TOKEN_TYPE_INCLUDE_MATCH;
}
else {
token->length = 1;
token->type = MyCSS_TOKEN_TYPE_DELIM;
}
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
return css_offset;
}
/////////////////////////////////////////////////////////
//// anything else
////
/////////////////////////////////////////////////////////
size_t mycss_tokenizer_state_delim_single_code_point(mycss_entry_t* entry, mycss_token_t* token, const char* css, size_t css_offset, size_t css_size)
{
const unsigned char *u_css = (const unsigned char*)css;
while (css_offset < css_size)
{
if(u_css[css_offset] < 128)
{
token->length = (entry->current_buffer->offset + css_offset) - token->begin;
token->type = MyCSS_TOKEN_TYPE_DELIM;
MyCSS_TOKEN_READY_CALLBACK_FUNCTION(entry, token);
entry->state = MyCSS_TOKENIZER_STATE_DATA;
break;
}
css_offset++;
}
return css_offset;
}
/////////////////////////////////////////////////////////
//// init tokenizer
////
/////////////////////////////////////////////////////////
mycss_status_t mycss_tokenizer_state_init(mycss_t* mycss)
{
mycss->parse_state_func = (mycss_tokenizer_state_f*)myhtml_calloc((MyCSS_TOKENIZER_STATE_LAST_ENTRY * 2), sizeof(mycss_tokenizer_state_f));
if(mycss->parse_state_func == NULL)
return MyCSS_STATUS_ERROR_TOKENIZER_STATE_ALLOCATION;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_DATA] = mycss_tokenizer_state_data;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_WHITESPACE] = mycss_tokenizer_state_whitespace;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_QUOTATION_MARK] = mycss_tokenizer_state_quotation_mark;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_QUOTATION_MARK_BACK] = mycss_tokenizer_state_quotation_mark_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_NUMBER_SIGN] = mycss_tokenizer_state_number_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_BACK] = mycss_tokenizer_state_number_sign_name_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_RSOLIDUS] = mycss_tokenizer_state_number_sign_name_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_DOLLAR_SIGN] = mycss_tokenizer_state_dollar_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_APOSTROPHE] = mycss_tokenizer_state_apostrophe;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_APOSTROPHE_BACK] = mycss_tokenizer_state_apostrophe_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LEFT_PARENTHESIS] = mycss_tokenizer_state_left_parenthesis;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_RIGHT_PARENTHESIS] = mycss_tokenizer_state_right_parenthesis;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_ASTERISK] = mycss_tokenizer_state_asterisk;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_PLUS_SIGN] = mycss_tokenizer_state_plus_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_PLUS_SIGN_FULL_STOP] = mycss_tokenizer_state_plus_sign_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMA] = mycss_tokenizer_state_comma;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_HYPHEN_MINUS] = mycss_tokenizer_state_hyphen_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_FULL_STOP] = mycss_tokenizer_state_hyphen_minus_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS] = mycss_tokenizer_state_hyphen_minus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS_RSOLIDUS] = mycss_tokenizer_state_hyphen_minus_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_RSOLIDUS] = mycss_tokenizer_state_hyphen_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_FULL_STOP] = mycss_tokenizer_state_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_SOLIDUS] = mycss_tokenizer_state_solidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_SOLIDUS_COMMENT_END] = mycss_tokenizer_state_solidus_comment_end;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COLON] = mycss_tokenizer_state_colon;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_SEMICOLON] = mycss_tokenizer_state_semicolon;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN] = mycss_tokenizer_state_less_than_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS] = mycss_tokenizer_state_less_than_sign_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS_MINUS] = mycss_tokenizer_state_less_than_sign_minus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMERCIAL_AT] = mycss_tokenizer_state_commercial_at;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS] = mycss_tokenizer_state_commercial_at_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS_RSOLIDUS] = mycss_tokenizer_state_commercial_at_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_RSOLIDUS] = mycss_tokenizer_state_commercial_at_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK] = mycss_tokenizer_state_commercial_at_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LEFT_SQUARE_BRACKET] = mycss_tokenizer_state_left_square_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_REVERSE_SOLIDUS] = mycss_tokenizer_state_reverse_solidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_RIGHT_SQUARE_BRACKET] = mycss_tokenizer_state_right_square_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_CIRCUMFLEX_ACCENT] = mycss_tokenizer_state_circumflex_accent;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LEFT_CURLY_BRACKET] = mycss_tokenizer_state_left_curly_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_RIGHT_CURLY_BRACKET] = mycss_tokenizer_state_right_curly_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_DIGIT] = mycss_tokenizer_state_digit;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LETTER_U] = mycss_tokenizer_state_letter_u;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LETTER_U_NEXT] = mycss_tokenizer_state_letter_u_next;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT] = mycss_tokenizer_state_name_start_code_point;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_VERTICAL_LINE] = mycss_tokenizer_state_vertical_line;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_TILDE] = mycss_tokenizer_state_tilde;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_DELIM_SINGLE_CODE_POINT] = mycss_tokenizer_state_delim_single_code_point;
// global
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_BACK] = mycss_tokenizer_global_back;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC] = mycss_tokenizer_global_state_numeric;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_MINUS] = mycss_tokenizer_global_state_numeric_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_MINUS_RSOLIDUS] = mycss_tokenizer_global_state_numeric_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_RSOLIDUS] = mycss_tokenizer_global_state_numeric_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DIGIT] = mycss_tokenizer_global_state_number_digit;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DOT] = mycss_tokenizer_global_state_number_dot;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DECIMAL] = mycss_tokenizer_global_state_number_decimal;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E] = mycss_tokenizer_global_state_number_e;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E_PLUS_MINUS] = mycss_tokenizer_global_state_number_e_plus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E_DECIMAL] = mycss_tokenizer_global_state_number_e_decimal;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_IDENT] = mycss_tokenizer_global_state_ident;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_URL] = mycss_tokenizer_global_state_url;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_URL_STRING_BACK] = mycss_tokenizer_global_state_url_string_back;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_URL_AFTER] = mycss_tokenizer_global_state_url_after;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_URL_AFTER_WHITESPACE] = mycss_tokenizer_global_state_url_after_whitespace;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_URL_RSOLIDUS] = mycss_tokenizer_global_state_url_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_BAD_URL] = mycss_tokenizer_global_state_bad_url;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NAME] = mycss_tokenizer_global_state_name;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_NAME_RSOLIDUS] = mycss_tokenizer_global_state_name_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED] = mycss_tokenizer_global_state_string_double_quoted;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED_RSOLIDUS] = mycss_tokenizer_global_state_string_double_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED_RSOLIDUS_R] = mycss_tokenizer_global_state_string_double_quoted_rsolidus_r;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED] = mycss_tokenizer_global_state_string_single_quoted;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED_RSOLIDUS] = mycss_tokenizer_global_state_string_single_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED_RSOLIDUS_R] = mycss_tokenizer_global_state_string_single_quoted_rsolidus_r;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_BEFORE] = mycss_tokenizer_global_state_unicode_range_before;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE] = mycss_tokenizer_global_state_unicode_range;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_QUESTION] = mycss_tokenizer_global_state_unicode_range_question;
mycss->parse_state_func[MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_MINUS] = mycss_tokenizer_global_state_unicode_range_minus;
// end
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_WHITESPACE] = mycss_tokenizer_end_state_whitespace;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_QUOTATION_MARK] = mycss_tokenizer_end_state_quotation_mark;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_QUOTATION_MARK_BACK] = mycss_tokenizer_end_state_quotation_mark_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_NUMBER_SIGN] = mycss_tokenizer_end_state_number_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_BACK] = mycss_tokenizer_end_state_number_sign_name_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_NUMBER_SIGN_NAME_RSOLIDUS] = mycss_tokenizer_end_state_number_sign_name_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_DOLLAR_SIGN] = mycss_tokenizer_end_state_dollar_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_APOSTROPHE] = mycss_tokenizer_end_state_apostrophe;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_APOSTROPHE_BACK] = mycss_tokenizer_end_state_apostrophe_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LEFT_PARENTHESIS] = mycss_tokenizer_end_state_left_parenthesis;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_RIGHT_PARENTHESIS] = mycss_tokenizer_end_state_right_parenthesis;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_ASTERISK] = mycss_tokenizer_end_state_asterisk;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_PLUS_SIGN] = mycss_tokenizer_end_state_plus_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_PLUS_SIGN_FULL_STOP] = mycss_tokenizer_end_state_plus_sign_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMA] = mycss_tokenizer_end_state_comma;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_HYPHEN_MINUS] = mycss_tokenizer_end_state_hyphen_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_FULL_STOP] = mycss_tokenizer_end_state_hyphen_minus_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS] = mycss_tokenizer_end_state_hyphen_minus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_MINUS_RSOLIDUS] = mycss_tokenizer_end_state_hyphen_minus_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_HYPHEN_MINUS_RSOLIDUS] = mycss_tokenizer_end_state_hyphen_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_FULL_STOP] = mycss_tokenizer_end_state_full_stop;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_SOLIDUS] = mycss_tokenizer_end_state_solidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_SOLIDUS_COMMENT_END] = mycss_tokenizer_end_state_solidus_comment_end;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COLON] = mycss_tokenizer_end_state_colon;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_SEMICOLON] = mycss_tokenizer_end_state_semicolon;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN] = mycss_tokenizer_end_state_less_than_sign;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS] = mycss_tokenizer_end_state_less_than_sign_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LESS_THAN_SIGN_MINUS_MINUS] = mycss_tokenizer_end_state_less_than_sign_minus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMERCIAL_AT] = mycss_tokenizer_end_state_commercial_at;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS] = mycss_tokenizer_end_state_commercial_at_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_MINUS_RSOLIDUS] = mycss_tokenizer_end_state_commercial_at_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_RSOLIDUS] = mycss_tokenizer_end_state_commercial_at_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_COMMERCIAL_AT_BACK] = mycss_tokenizer_end_state_commercial_at_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LEFT_SQUARE_BRACKET] = mycss_tokenizer_end_state_left_square_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_REVERSE_SOLIDUS] = mycss_tokenizer_end_state_reverse_solidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_RIGHT_SQUARE_BRACKET] = mycss_tokenizer_end_state_right_square_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_CIRCUMFLEX_ACCENT] = mycss_tokenizer_end_state_circumflex_accent;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LEFT_CURLY_BRACKET] = mycss_tokenizer_end_state_left_curly_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_RIGHT_CURLY_BRACKET] = mycss_tokenizer_end_state_right_curly_bracket;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_DIGIT] = mycss_tokenizer_end_state_digit;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LETTER_U] = mycss_tokenizer_end_state_letter_u;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_LETTER_U_NEXT] = mycss_tokenizer_end_state_letter_u_next;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_NAME_START_CODE_POINT] = mycss_tokenizer_end_state_name_start_code_point;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_VERTICAL_LINE] = mycss_tokenizer_end_state_vertical_line;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_TILDE] = mycss_tokenizer_end_state_tilde;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_STATE_DELIM_SINGLE_CODE_POINT] = mycss_tokenizer_end_state_delim_single_code_point;
// global end
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_BACK] = mycss_tokenizer_end_global_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC] = mycss_tokenizer_end_global_state_numeric;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_MINUS] = mycss_tokenizer_end_global_state_numeric_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_MINUS_RSOLIDUS] = mycss_tokenizer_end_global_state_numeric_minus_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMERIC_RSOLIDUS] = mycss_tokenizer_end_global_state_numeric_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DIGIT] = mycss_tokenizer_end_global_state_number_digit;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DOT] = mycss_tokenizer_end_global_state_number_dot;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_DECIMAL] = mycss_tokenizer_end_global_state_number_decimal;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E] = mycss_tokenizer_end_global_state_number_e;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E_PLUS_MINUS] = mycss_tokenizer_end_global_state_number_e_plus_minus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NUMBER_E_DECIMAL] = mycss_tokenizer_end_global_state_number_e_decimal;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_IDENT] = mycss_tokenizer_end_global_state_ident;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_URL] = mycss_tokenizer_end_global_state_url;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_URL_STRING_BACK] = mycss_tokenizer_end_global_state_url_string_back;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_URL_AFTER] = mycss_tokenizer_end_global_state_url_after;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_URL_AFTER_WHITESPACE] = mycss_tokenizer_end_global_state_url_after_whitespace;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_URL_RSOLIDUS] = mycss_tokenizer_end_global_state_url_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_BAD_URL] = mycss_tokenizer_end_global_state_bad_url;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NAME] = mycss_tokenizer_end_global_state_name;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_NAME_RSOLIDUS] = mycss_tokenizer_end_global_state_name_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED] = mycss_tokenizer_end_global_state_string_double_quoted;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED_RSOLIDUS] = mycss_tokenizer_end_global_state_string_double_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_DOUBLE_QUOTED_RSOLIDUS_R] = mycss_tokenizer_end_global_state_string_double_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED] = mycss_tokenizer_end_global_state_string_single_quoted;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED_RSOLIDUS] = mycss_tokenizer_end_global_state_string_single_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_STRING_SINGLE_QUOTED_RSOLIDUS_R] = mycss_tokenizer_end_global_state_string_single_quoted_rsolidus;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_BEFORE] = mycss_tokenizer_end_global_state_unicode_range_before;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE] = mycss_tokenizer_end_global_state_unicode_range;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_QUESTION] = mycss_tokenizer_end_global_state_unicode_range_question;
mycss->parse_state_func[MyCSS_TOKENIZER_STATE_LAST_ENTRY + MyCSS_TOKENIZER_GLOBAL_STATE_UNICODE_RANGE_MINUS] = mycss_tokenizer_end_global_state_unicode_range_minus;
return MyCSS_STATUS_OK;
}
void mycss_tokenizer_state_destroy(mycss_t* mycss)
{
if(mycss->parse_state_func) {
free(mycss->parse_state_func);
mycss->parse_state_func = NULL;
}
}