You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
517 lines
14 KiB
517 lines
14 KiB
/*****************************************************************************
|
|
* css_parser.c : CSS parser
|
|
*****************************************************************************
|
|
* Copyright (C) 2017 VideoLabs, VLC authors and VideoLAN
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms of the GNU Lesser General Public License as published by
|
|
* the Free Software Foundation; either version 2.1 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
|
|
*****************************************************************************/
|
|
#ifdef HAVE_CONFIG_H
|
|
# include "config.h"
|
|
#endif
|
|
|
|
#include <vlc_common.h>
|
|
|
|
#include "css_bridge.h"
|
|
#include "css_parser.h"
|
|
#include "CSSGrammar.h"
|
|
|
|
#include <ctype.h>
|
|
|
|
/* Forward declarations of the file-local debug printers defined further down
 * in this file; each takes the item to print and an indentation depth. */
static void vlc_css_term_Debug( const vlc_css_term_t a, int depth );
|
|
static void vlc_css_expression_Debug( const vlc_css_expr_t *p_expr, int depth );
|
|
static void vlc_css_declarations_Debug( const vlc_css_declaration_t *p_decl, int depth );
|
|
static void vlc_css_selectors_Debug( const vlc_css_selector_t *p_sel, int depth );
|
|
static void vlc_css_rules_Debug( const vlc_css_rule_t *p_rule, int depth );
|
|
|
|
/* Emits the definition of a chain-append function. The prototype is produced
 * by CHAIN_APPEND_DECL(n, t) (defined elsewhere); the body relies on it naming
 * its parameters p_a and p_b. The body follows the p_next links starting at
 * p_a until it reaches an empty one and stores p_b there. p_a is dereferenced
 * unconditionally. */
#define CHAIN_APPEND_IMPL(n, t) CHAIN_APPEND_DECL(n ,t)\
{\
    t **pp_tail;\
    for( pp_tail = &p_a->p_next; *pp_tail; pp_tail = &(*pp_tail)->p_next )\
        ;\
    *pp_tail = p_b;\
}
|
|
|
|
/* Releases what a term holds: the psz buffer for every type at or above
 * TYPE_STRING, and additionally the nested expression of a TYPE_FUNCTION
 * term. The term itself is passed by value and is not freed. */
void vlc_css_term_Clean( vlc_css_term_t a )
{
    /* Types below TYPE_STRING do not have their psz freed */
    if( !( a.type < TYPE_STRING ) )
        free( a.psz );

    /* A function term may also carry an expression of its own */
    if( a.type == TYPE_FUNCTION && a.function )
        vlc_css_expression_Delete( a.function );
}
|
|
|
|
static void vlc_css_term_Debug( const vlc_css_term_t a, int depth )
|
|
{
|
|
for(int i=0;i<depth;i++) printf(" ");
|
|
printf("term: ");
|
|
if( a.type >= TYPE_STRING )
|
|
{
|
|
printf("%x %s\n", a.type, a.psz);
|
|
if( a.type == TYPE_FUNCTION && a.function )
|
|
vlc_css_expression_Debug( a.function, depth + 1 );
|
|
}
|
|
else printf("%x %f\n", a.type, a.val);
|
|
}
|
|
|
|
/* Appends the pair (op, a) to the expression's term sequence.
 *
 * When the sequence is full it is grown with realloc(): to one entry if
 * nothing was allocated yet, otherwise by four entries.
 *
 * Returns true when the term was stored. Returns false when no room could be
 * obtained; in that case the expression is left as it was and `a` is not
 * cleaned by this function. */
bool vlc_css_expression_AddTerm( vlc_css_expr_t *p_expr,
                                 char op, vlc_css_term_t a )
{
    if( p_expr->i_count >= p_expr->i_alloc )
    {
        size_t i_wanted;
        if( p_expr->i_alloc == 0 )
            i_wanted = 1;
        else
            i_wanted = p_expr->i_alloc + 4;

        /* Keep the old array reachable until realloc() has succeeded */
        void *p_grown = realloc( p_expr->seq, i_wanted * sizeof(p_expr->seq[0]) );
        if( p_grown )
        {
            p_expr->seq = p_grown;
            p_expr->i_alloc = i_wanted;
        }

        /* Still no free slot: allocation failed */
        if( p_expr->i_count >= p_expr->i_alloc )
            return false;
    }

    p_expr->seq[p_expr->i_count].op = op;
    p_expr->seq[p_expr->i_count].term = a;
    p_expr->i_count++;
    return true;
}
|
|
|
|
/* Destroys an expression: cleans each stored term, then frees the term array
 * and the expression itself. A NULL expression is accepted and ignored. */
void vlc_css_expression_Delete( vlc_css_expr_t *p_expr )
{
    if( !p_expr )
        return;

    size_t i_term = 0;
    while( i_term < p_expr->i_count )
    {
        vlc_css_term_Clean( p_expr->seq[i_term].term );
        i_term++;
    }

    free( p_expr->seq );
    free( p_expr );
}
|
|
|
|
static void vlc_css_expression_Debug( const vlc_css_expr_t *p_expr, int depth )
|
|
{
|
|
if( p_expr )
|
|
{
|
|
for(int i=0;i<depth;i++) printf(" ");
|
|
printf("expression: \n");
|
|
for(size_t i=0; i<p_expr->i_count; i++)
|
|
vlc_css_term_Debug( p_expr->seq[i].term, depth + 1 );
|
|
}
|
|
}
|
|
|
|
/* Allocates a new expression holding `term` as its first entry (stored with
 * operator 0).
 *
 * Returns the new expression, to be released with vlc_css_expression_Delete(),
 * or NULL when memory could not be allocated. On failure `term` is not
 * cleaned here. */
vlc_css_expr_t * vlc_css_expression_New( vlc_css_term_t term )
{
    vlc_css_expr_t *p_expr = calloc(1, sizeof(*p_expr));
    /* vlc_css_expression_AddTerm() dereferences its expression argument, so
     * an allocation failure must be caught before calling it. */
    if( !p_expr )
        return NULL;

    if( !vlc_css_expression_AddTerm( p_expr, 0, term ) )
    {
        free( p_expr );
        return NULL;
    }
    return p_expr;
}
|
|
|
|
/* Instantiates CHAIN_APPEND_IMPL for vlc_css_declaration_t under the name
 * vlc_css_declarations_Append: the generated body stores p_b in the first
 * empty p_next link found when walking from p_a. */
CHAIN_APPEND_IMPL(vlc_css_declarations_Append, vlc_css_declaration_t)
|
|
|
|
/* Frees a whole chain of declarations: for every node, its expression, its
 * property name and the node itself. NULL is an empty chain. */
void vlc_css_declarations_Delete( vlc_css_declaration_t *p_decl )
{
    for( vlc_css_declaration_t *p_following; p_decl; p_decl = p_following )
    {
        /* Read the link before the node is released */
        p_following = p_decl->p_next;

        vlc_css_expression_Delete( p_decl->expr );
        free( p_decl->psz_property );
        free( p_decl );
    }
}
|
|
|
|
static void vlc_css_declarations_Debug( const vlc_css_declaration_t *p_decl, int depth )
|
|
{
|
|
while( p_decl )
|
|
{
|
|
for(int i=0;i<depth;i++) printf(" ");
|
|
printf("declaration: %s\n", p_decl->psz_property );
|
|
vlc_css_expression_Debug( p_decl->expr, depth + 1 );
|
|
p_decl = p_decl->p_next;
|
|
}
|
|
}
|
|
|
|
vlc_css_declaration_t * vlc_css_declaration_New( const char *psz )
|
|
{
|
|
vlc_css_declaration_t *p_decl = calloc(1, sizeof(*p_decl));
|
|
p_decl->psz_property = strdup(psz);
|
|
return p_decl;
|
|
}
|
|
|
|
/* Instantiates CHAIN_APPEND_IMPL for vlc_css_selector_t under the name
 * vlc_css_selector_Append: the generated body stores p_b in the first empty
 * p_next link found when walking from p_a. */
CHAIN_APPEND_IMPL(vlc_css_selector_Append, vlc_css_selector_t)
|
|
|
|
void
|
|
vlc_css_selector_AddSpecifier( vlc_css_selector_t *p_sel, vlc_css_selector_t *p_spec )
|
|
{
|
|
*p_sel->specifiers.pp_append = p_spec;
|
|
while(p_spec)
|
|
{
|
|
p_sel->specifiers.pp_append = &p_spec->p_next;
|
|
p_spec = p_spec->p_next;
|
|
}
|
|
}
|
|
|
|
/* Frees a chain of selectors. For every node the name is freed, the
 * specifier list and the p_matchsel chain are deleted recursively, and then
 * the node itself is freed. NULL is an empty chain. */
void vlc_css_selectors_Delete( vlc_css_selector_t *p_sel )
{
    for( vlc_css_selector_t *p_following; p_sel; p_sel = p_following )
    {
        /* Read the link before the node is released */
        p_following = p_sel->p_next;

        free( p_sel->psz_name );
        vlc_css_selectors_Delete( p_sel->specifiers.p_first );
        vlc_css_selectors_Delete( p_sel->p_matchsel );
        free( p_sel );
    }
}
|
|
|
|
static void vlc_css_selectors_Debug( const vlc_css_selector_t *p_sel, int depth )
|
|
{
|
|
while( p_sel )
|
|
{
|
|
for(int i=0;i<depth;i++) printf(" "); printf("selector %c%s:\n", p_sel->combinator, p_sel->psz_name );
|
|
vlc_css_selectors_Debug( p_sel->p_matchsel, depth + 1 );
|
|
vlc_css_selectors_Debug( p_sel->specifiers.p_first, depth + 1 );
|
|
p_sel = p_sel->p_next;
|
|
}
|
|
}
|
|
|
|
vlc_css_selector_t * vlc_css_selector_New( int type, const char *psz )
|
|
{
|
|
vlc_css_selector_t *p_sel = calloc(1, sizeof(*p_sel));
|
|
p_sel->psz_name = strdup(psz);
|
|
p_sel->type = type;
|
|
p_sel->combinator = RELATION_SELF;
|
|
p_sel->specifiers.pp_append = &p_sel->specifiers.p_first;
|
|
return p_sel;
|
|
}
|
|
|
|
/* Frees a chain of rules: for every node, its selectors, its declarations
 * and the node itself. NULL is an empty chain. */
void vlc_css_rules_Delete( vlc_css_rule_t *p_rule )
{
    for( vlc_css_rule_t *p_following; p_rule; p_rule = p_following )
    {
        /* Read the link before the node is released */
        p_following = p_rule->p_next;

        vlc_css_selectors_Delete( p_rule->p_selectors );
        vlc_css_declarations_Delete( p_rule->p_declarations );
        free( p_rule );
    }
}
|
|
|
|
static void vlc_css_rules_Debug( const vlc_css_rule_t *p_rule, int depth )
|
|
{
|
|
int j = 0;
|
|
while(p_rule)
|
|
{
|
|
for(int i=0;i<depth;i++) printf(" "); printf("rule %d:\n", j++);
|
|
vlc_css_selectors_Debug( p_rule->p_selectors, depth + 1 );
|
|
vlc_css_declarations_Debug( p_rule->p_declarations, depth + 1 );
|
|
p_rule = p_rule->p_next;
|
|
}
|
|
}
|
|
|
|
vlc_css_rule_t * vlc_css_rule_New( void )
|
|
{
|
|
vlc_css_rule_t *p_rule = calloc(1, sizeof(*p_rule));
|
|
return p_rule;
|
|
}
|
|
|
|
void vlc_css_parser_AddRule( vlc_css_parser_t *p_parser,
|
|
vlc_css_rule_t *p_rule )
|
|
{
|
|
(*p_parser->rules.pp_append) = p_rule;
|
|
p_parser->rules.pp_append = &p_rule->p_next;
|
|
}
|
|
|
|
void vlc_css_parser_Debug( const vlc_css_parser_t *p_parser )
|
|
{
|
|
vlc_css_rules_Debug( p_parser->rules.p_first, 0 );
|
|
}
|
|
|
|
/* Frees every rule held by the parser. The parser's own list pointers are
 * not reset by this function. */
void vlc_css_parser_Clean( vlc_css_parser_t *p_parser )
{
    vlc_css_rule_t *p_head = p_parser->rules.p_first;

    vlc_css_rules_Delete( p_head );
}
|
|
|
|
/* Puts a parser into its empty state: every byte zeroed, and the rule list's
 * append pointer aimed at the list head. */
void vlc_css_parser_Init( vlc_css_parser_t *p_parser )
{
    memset( p_parser, 0, sizeof(*p_parser) );

    /* The first rule added will land in rules.p_first */
    p_parser->rules.pp_append = &p_parser->rules.p_first;
}
|
|
|
|
/* Parses `i_data` bytes of CSS from `p_data` into `p_parser`.
 *
 * A scanner is created for the duration of the call and destroyed before
 * returning.
 *
 * Returns true when cssparse() reports success (returns 0). Returns false
 * when parsing fails, or when the scanner or its input buffer could not be
 * set up. */
bool vlc_css_parser_ParseBytes( vlc_css_parser_t *p_parser, const uint8_t *p_data, size_t i_data )
{
    yyscan_t yy;
    /* A failed init leaves `yy` unusable: do not pass it any further */
    if( csslex_init( &yy ) != 0 )
        return false;

    bool b_ret = false;

    YY_BUFFER_STATE buf = css_scan_bytes( (const char*) p_data, i_data, yy );
    if( buf )
    {
        b_ret = !cssparse( yy, p_parser );
        css_delete_buffer( buf, yy );
    }

    csslex_destroy( yy );

    return b_ret;
}
|
|
|
|
/* Parses the NUL-terminated CSS text `psz_css` into `p_parser`.
 *
 * A scanner is created for the duration of the call and destroyed before
 * returning.
 *
 * Returns true when cssparse() reports success (returns 0). Returns false
 * when parsing fails, or when the scanner or its input buffer could not be
 * set up. */
bool vlc_css_parser_ParseString( vlc_css_parser_t *p_parser, const char *psz_css )
{
    yyscan_t yy;
    /* A failed init leaves `yy` unusable: do not pass it any further */
    if( csslex_init( &yy ) != 0 )
        return false;

    bool b_ret = false;

    YY_BUFFER_STATE buf = css_scan_string( psz_css, yy );
    if( buf )
    {
        b_ret = !cssparse( yy, p_parser );
        css_delete_buffer( buf, yy );
    }

    csslex_destroy( yy );

    return b_ret;
}
|
|
|
|
/* Writes the UTF-8 style byte sequence for `ucs4` at `p` and returns how many
 * bytes were written (1 to 6). No terminator is appended and no validity
 * check is made on the value: anything above 0x1FFFFF is written with the
 * 5- or 6-byte lead patterns 0xF8 / 0xFC. `p` must have room for 6 bytes. */
static int CodePointToUTF8( uint32_t ucs4, char *p )
{
    /* Largest value representable with 1, 2, 3, 4 and 5 bytes */
    static const uint32_t pi_limit[5] = { 0x7F, 0x7FF, 0xFFFF, 0x1FFFFF, 0x3FFFFFF };
    /* Marker bits of the first byte, indexed by (length - 1) */
    static const unsigned char pi_lead[6] = { 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC };

    int i_len = 1;
    while( i_len < 6 && ucs4 > pi_limit[i_len - 1] )
        i_len++;

    /* Continuation bytes carry 6 bits each, filled from the last one back */
    uint32_t i_rest = ucs4;
    for( int i = i_len - 1; i > 0; i-- )
    {
        p[i] = 0x80 | (i_rest & 0x3F);
        i_rest >>= 6;
    }

    /* Whatever is left goes in the first byte, next to the marker bits */
    p[0] = pi_lead[i_len - 1] | i_rest;
    return i_len;
}
|
|
|
|
/* Resolves backslash escapes in `psz`, in place. NULL is accepted and
 * ignored. The result is never longer than the input.
 *
 * Escapes handled:
 *  - \n, \r, \f     become LF, CR and FF; "\rn" becomes CR LF.
 *  - \ + 1..6 hex   becomes the UTF-8 encoding of that code point; one space
 *                   directly after fewer than six digits is swallowed.
 *                   Code point 0, surrogates (0xD800-0xDFFF) and values above
 *                   0x10FFFF are replaced by U+FFFD, or dropped in the one
 *                   case where U+FFFD would not fit in the consumed input.
 *  - \ + other      the character stands for itself, so "\\" is a backslash.
 *  - \ at the end   the dangling backslash is dropped.
 */
void vlc_css_unescape( char *psz )
{
    if( !psz )
        return;

    char *r = psz; /* read position */
    char *w = psz; /* write position, never ahead of r */

    while( *r )
    {
        if( *r != '\\' )
        {
            *w++ = *r++;
            continue;
        }

        r++; /* skip the backslash */
        if( *r == 0 )
            break;

        switch( *r )
        {
            case 'n':
                *w++ = '\n';
                r++;
                break;
            case 'r':
                *w++ = '\r';
                if( r[1] == 'n' )
                {
                    *w++ = '\n';
                    r++;
                }
                r++;
                break;
            case 'f': /* tested before the hex digits, 'f' being one of them */
                *w++ = '\f';
                r++;
                break;
            default:
                /* <ctype.h> functions need a value representable as
                 * unsigned char; a plain char may be negative. */
                if( isxdigit( (unsigned char) *r ) )
                {
                    const char *p_start = r;
                    int i;
                    for( i=0; i<6 && isxdigit( (unsigned char) *r ); i++ )
                        r++;

                    /* Terminate the digit run temporarily so that strtoul()
                     * cannot read past the six digits allowed. */
                    const char backup = *r;
                    *r = 0;
                    unsigned long i_value = strtoul( p_start, NULL, 16 );
                    *r = backup;

                    if( i < 6 && *r == ' ' )
                        r++;

                    if( i_value == 0 || i_value > 0x10FFFF ||
                        ( i_value >= 0xD800 && i_value <= 0xDFFF ) )
                    {
                        /* U+FFFD takes 3 bytes: writing it must not run over
                         * input that has not been read yet ("\0" is only 2). */
                        if( r - w < 3 )
                            break;
                        i_value = 0xFFFD;
                    }
                    w += CodePointToUTF8( (uint32_t) i_value, w );
                }
                else
                {
                    /* Any other escaped character is taken literally. Copying
                     * it here keeps an escaped backslash from being read as
                     * the start of another escape. */
                    *w++ = *r++;
                }
                break;
        }
    }

    *w = 0;
}
|
|
|
|
/* Returns a newly allocated copy of `psz` with its escapes resolved by
 * vlc_css_unescape(), or NULL when the copy could not be allocated.
 * The caller frees the result. */
char * vlc_css_unescaped( const char *psz )
{
    char *psz_copy = strdup( psz );

    if( psz_copy )
        vlc_css_unescape( psz_copy );
    return psz_copy;
}
|
|
|
|
/* Returns a newly allocated copy of `psz` without its surrounding quotes.
 *
 * The quotes are removed only when the string has at least two characters,
 * starts with ' or " and ends with that same character. Any other input,
 * including a lone quote character, is copied unchanged.
 *
 * Returns NULL when the copy could not be allocated. The caller frees the
 * result. */
char * vlc_css_unquoted( const char *psz )
{
    if( *psz == '\'' || *psz == '\"' )
    {
        const size_t i_len = strlen( psz );
        /* Below two characters there is no closing quote, and i_len - 2
         * would wrap around. */
        if( i_len >= 2 && psz[i_len - 1] == psz[0] )
            return strndup( psz + 1, i_len - 2 );
    }

    return strdup( psz );
}
|
|
|
|
|
|
char * vlc_css_unquotedunescaped( const char *psz )
|
|
{
|
|
char *psz_ret = vlc_css_unquoted( psz );
|
|
if( psz_ret )
|
|
vlc_css_unescape( psz_ret );
|
|
return psz_ret;
|
|
}
|
|
|
|
#ifdef CSS_PARSER_DEBUG
|
|
|
|
|
|
static void css_properties_Debug( const vlc_css_declaration_t *p_decl )
|
|
{
|
|
printf("set %s to ", p_decl->psz_property);
|
|
for( size_t i=0; i<p_decl->expr->i_count; i++ )
|
|
{
|
|
printf("term %s ", p_decl->expr->seq[i].term.psz);
|
|
}
|
|
printf("\n");
|
|
}
|
|
|
|
void css_selector_Debug( const vlc_css_selector_t *p_sel )
|
|
{
|
|
printf("select its ");
|
|
switch( p_sel->combinator )
|
|
{
|
|
case RELATION_DESCENDENT:
|
|
printf("descendent");
|
|
break;
|
|
case RELATION_DIRECTADJACENT:
|
|
printf("adjacent");
|
|
break;
|
|
case RELATION_INDIRECTADJACENT:
|
|
printf("indirect adjacent");
|
|
break;
|
|
case RELATION_CHILD:
|
|
printf("child");
|
|
break;
|
|
case RELATION_SELF:
|
|
break;
|
|
}
|
|
|
|
printf(" nodes matching filter: ");
|
|
switch( p_sel->type )
|
|
{
|
|
case SELECTOR_SIMPLE:
|
|
printf("<%s>\n", p_sel->psz_name);
|
|
break;
|
|
case SELECTOR_PSEUDOCLASS:
|
|
printf(":%s\n", p_sel->psz_name);
|
|
break;
|
|
case SELECTOR_PSEUDOELEMENT:
|
|
printf("::%s\n", p_sel->psz_name);
|
|
break;
|
|
case SPECIFIER_ID:
|
|
printf("%s\n", p_sel->psz_name);
|
|
break;
|
|
case SPECIFIER_CLASS:
|
|
printf(".%s\n", p_sel->psz_name);
|
|
break;
|
|
case SPECIFIER_ATTRIB:
|
|
printf("[%s]\n", p_sel->psz_name);
|
|
break;
|
|
}
|
|
}
|
|
|
|
void css_rule_Debug( const vlc_css_rule_t *p_rule )
|
|
{
|
|
if( p_rule == NULL )
|
|
return;
|
|
printf("add for rule nodes:\n");
|
|
for( const vlc_css_selector_t *p_sel = p_rule->p_selectors;
|
|
p_sel; p_sel = p_sel->p_next )
|
|
{
|
|
css_selector_Debug( p_sel );
|
|
for( const vlc_css_selector_t *p_spec = p_sel->specifiers.p_first;
|
|
p_spec; p_spec = p_spec->p_next )
|
|
css_selector_Debug( p_spec );
|
|
|
|
if( p_sel->p_next )
|
|
printf("add nodes\n");
|
|
}
|
|
|
|
for( const vlc_css_declaration_t *p_decl = p_rule->p_declarations;
|
|
p_decl; p_decl = p_decl->p_next )
|
|
{
|
|
css_properties_Debug( p_decl );
|
|
}
|
|
}
|
|
|
|
#endif
|
|
|