/*
 * Copyright (C) 2009-2011 Vincent Hanquez
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published
 * by the Free Software Foundation; version 2.1 or version 3.0 only.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 */

/*
 * the class, states and state transition tables have been inspired by the JSON_parser.c
 * available at http://json.org, but are quite different on the way that the
 * parser handles its parse buffer and contains significant differences that affect
 * the JSON compliance.
 */

#include "pa_json.h"

/* character classes: every input byte is first reduced to one of these, and
 * the class is then used as the column index of the two tables below. */
enum classes {
	C_SPACE, /* space */
	C_NL,    /* newline */
	C_WHITE, /* tab, CR */
	C_LCURB, C_RCURB, /* object opening/closing */
	C_LSQRB, C_RSQRB, /* array opening/closing */
	/* syntax symbols */
	C_COLON,
	C_COMMA,
	C_QUOTE, /* " */
	C_BACKS, /* \ */
	C_SLASH, /* / */
	C_PLUS,
	C_MINUS,
	C_DOT,
	C_ZERO, C_DIGIT, /* digits */
	C_a, C_b, C_c, C_d, C_e, C_f, C_l, C_n, C_r, C_s, C_t, C_u, /* nocaps letters */
	C_ABCDF, C_E, /* caps letters */
	C_OTHER, /* all other */
	C_STAR, /* star in C style comment */
	C_HASH, /* # for YAML comment */
	C_ERROR = 0xfe,
};

/* map from character < 128 to classes. from 128 to 256 all C_OTHER
 * (that second half is handled by the caller, not stored in the table) */
static const uint8_t character_class[128] = {
	C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR,
	C_ERROR, C_WHITE, C_NL,    C_ERROR, C_ERROR, C_WHITE, C_ERROR, C_ERROR,
	C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR,
	C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR, C_ERROR,

	C_SPACE, C_OTHER, C_QUOTE, C_HASH,  C_OTHER, C_OTHER, C_OTHER, C_OTHER,
	C_OTHER, C_OTHER, C_STAR,  C_PLUS,  C_COMMA, C_MINUS, C_DOT,   C_SLASH,
	C_ZERO,  C_DIGIT, C_DIGIT, C_DIGIT, C_DIGIT, C_DIGIT, C_DIGIT, C_DIGIT,
	C_DIGIT, C_DIGIT, C_COLON, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER,

	C_OTHER, C_ABCDF, C_ABCDF, C_ABCDF, C_ABCDF, C_E,     C_ABCDF, C_OTHER,
	C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER,
	C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_OTHER,
	C_OTHER, C_OTHER, C_OTHER, C_LSQRB, C_BACKS, C_RSQRB, C_OTHER, C_OTHER,

	C_OTHER, C_a,     C_b,     C_c,     C_d,     C_e,     C_f,     C_OTHER,
	C_OTHER, C_OTHER, C_OTHER, C_OTHER, C_l,     C_OTHER, C_n,     C_OTHER,
	C_OTHER, C_OTHER, C_r,     C_s,     C_t,     C_u,     C_OTHER, C_OTHER,
	C_OTHER, C_OTHER, C_OTHER, C_LCURB, C_OTHER, C_RCURB, C_OTHER, C_OTHER
};

/* define all states and actions that will be taken on each transition.
 *
 * states are defined first because of the fact they are used as indexes in the
 * transitions table. they usually contain either a number or a prefix _
 * for simple state like string, object, value ...
 *
 * actions are defined starting from 0x80. state error is defined as 0xff
 */
enum states {
	STATE_GO, /* start  */
	STATE_OK, /* ok     */
	STATE_OO, /* object */
	STATE_KK, /* key    */
	STATE_CO, /* colon  */
	STATE_VV, /* value  */
	STATE_AA, /* array  */
	STATE_SS, /* string */
	STATE_E0, /* escape */
	STATE_U1, STATE_U2, STATE_U3, STATE_U4, /* unicode states */
	STATE_M0, STATE_Z0, STATE_I0, /* number states */
	STATE_R1, STATE_R2, /* real states (after-dot digits) */
	STATE_X1, STATE_X2, STATE_X3, /* exponent states */
	STATE_T1, STATE_T2, STATE_T3, /* true constant states */
	STATE_F1, STATE_F2, STATE_F3, STATE_F4, /* false constant states */
	STATE_N1, STATE_N2, STATE_N3, /* null constant states */
	STATE_C1, STATE_C2, STATE_C3, /* C-comment states */
	STATE_Y1, /* YAML-comment state */
	STATE_D1, STATE_D2, /* multi unicode states */
};

/* the following are actions that need to be taken */
enum actions {
	STATE_KS = 0x80, /* key separator */
	STATE_SP, /* comma separator */
	STATE_AB, /* array begin */
	STATE_AE, /* array ending */
	STATE_OB, /* object begin */
	STATE_OE, /* object end */
	STATE_CB, /* C-comment begin */
	STATE_YB, /* YAML-comment begin */
	STATE_CE, /* YAML/C comment end */
	STATE_FA, /* false */
	STATE_TR, /* true */
	STATE_NU, /* null */
	STATE_DE, /* double detected by exponent */
	STATE_DF, /* double detected by . */
	STATE_SE, /* string end */
	STATE_MX, /* integer detected by minus */
	STATE_ZX, /* integer detected by zero */
	STATE_IX, /* integer detected by 1-9 */
	STATE_UC, /* Unicode character read */
};

/* some compilers have the following names defined */
#undef _C2
#undef ST_
#undef PT_

/* error state */
#define STATE___ 0xff

#define NR_STATES (STATE_D2 + 1)
#define NR_CLASSES (C_HASH + 1)

/* actions start at 0x80, plain states are all below it */
#define IS_STATE_ACTION(s) ((s) & 0x80)

/* ST_ pastes the STATE prefix so that table rows can be written compactly;
 * PT_ builds one 34-entry row (one entry per character class). */
#define ST_(x) STATE##x
#define PT_(a,b,c,d,e,f,g,h,i,j,k,l,m,n,o,p,q,r,s,t,u,v,w,x,y,z,a1,b1,c1,d1,e1,f1,g1,h1) \
	{ ST_(a),ST_(b),ST_(c),ST_(d),ST_(e),ST_(f),ST_(g),ST_(h),ST_(i),ST_(j),ST_(k),ST_(l),ST_(m),ST_(n), \
	  ST_(o),ST_(p),ST_(q),ST_(r),ST_(s),ST_(t),ST_(u),ST_(v),ST_(w),ST_(x),ST_(y),ST_(z),ST_(a1),ST_(b1), \
	  ST_(c1),ST_(d1),ST_(e1),ST_(f1),ST_(g1),ST_(h1) }

/* map from the (previous state+new character class) to the next parser transition */
static const uint8_t state_transition_table[NR_STATES][NR_CLASSES] = {
/*                white                                                                                                       ABCDF   other        */
/*          sp  nl  |   {   }   [   ]   :   ,   "   \   /   +   -   .   0   19  a   b   c   d   e   f   l   n   r   s   t   u   |   E   |   *   #  */
/*GO*/ PT_(_GO,_GO,_GO,_OB,___,_AB,___,___,___,___,___,_CB,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*OK*/ PT_(_OK,_OK,_OK,___,_OE,___,_AE,___,_SP,___,___,_CB,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*OO*/ PT_(_OO,_OO,_OO,___,_OE,___,___,___,___,_SS,___,_CB,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*KK*/ PT_(_KK,_KK,_KK,___,___,___,___,___,___,_SS,___,_CB,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*CO*/ PT_(_CO,_CO,_CO,___,___,___,___,_KS,___,___,___,_CB,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*VV*/ PT_(_VV,_VV,_VV,_OB,___,_AB,___,___,___,_SS,___,_CB,___,_MX,___,_ZX,_IX,___,___,___,___,___,_F1,___,_N1,___,___,_T1,___,___,___,___,___,_YB),
/*AA*/ PT_(_AA,_AA,_AA,_OB,___,_AB,_AE,___,___,_SS,___,_CB,___,_MX,___,_ZX,_IX,___,___,___,___,___,_F1,___,_N1,___,___,_T1,___,___,___,___,___,_YB),
/**************************************************************************************************************************************************/
/*SS*/ PT_(_SS,___,___,_SS,_SS,_SS,_SS,_SS,_SS,_SE,_E0,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS,_SS),
/*E0*/ PT_(___,___,___,___,___,___,___,___,___,_SS,_SS,_SS,___,___,___,___,___,___,_SS,___,___,___,_SS,___,_SS,_SS,___,_SS,_U1,___,___,___,___,___),
/*U1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_U2,_U2,_U2,_U2,_U2,_U2,_U2,_U2,___,___,___,___,___,___,_U2,_U2,___,___,___),
/*U2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_U3,_U3,_U3,_U3,_U3,_U3,_U3,_U3,___,___,___,___,___,___,_U3,_U3,___,___,___),
/*U3*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_U4,_U4,_U4,_U4,_U4,_U4,_U4,_U4,___,___,___,___,___,___,_U4,_U4,___,___,___),
/*U4*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_UC,_UC,_UC,_UC,_UC,_UC,_UC,_UC,___,___,___,___,___,___,_UC,_UC,___,___,___),
/**************************************************************************************************************************************************/
/*M0*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_Z0,_I0,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*Z0*/ PT_(_OK,_OK,_OK,___,_OE,___,_AE,___,_SP,___,___,_CB,___,___,_DF,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_YB),
/*I0*/ PT_(_OK,_OK,_OK,___,_OE,___,_AE,___,_SP,___,___,_CB,___,___,_DF,_I0,_I0,___,___,___,___,_DE,___,___,___,___,___,___,___,___,_DE,___,___,_YB),
/*R1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_R2,_R2,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*R2*/ PT_(_OK,_OK,_OK,___,_OE,___,_AE,___,_SP,___,___,_CB,___,___,___,_R2,_R2,___,___,___,___,_X1,___,___,___,___,___,___,___,___,_X1,___,___,_YB),
/*X1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,_X2,_X2,___,_X3,_X3,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*X2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_X3,_X3,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*X3*/ PT_(_OK,_OK,_OK,___,_OE,___,_AE,___,_SP,___,___,___,___,___,___,_X3,_X3,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/**************************************************************************************************************************************************/
/*T1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_T2,___,___,___,___,___,___,___,___),
/*T2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_T3,___,___,___,___,___),
/*T3*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_TR,___,___,___,___,___,___,___,___,___,___,___,___),
/*F1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_F2,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*F2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_F3,___,___,___,___,___,___,___,___,___,___),
/*F3*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_F4,___,___,___,___,___,___,___),
/*F4*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_FA,___,___,___,___,___,___,___,___,___,___,___,___),
/*N1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_N2,___,___,___,___,___),
/*N2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_N3,___,___,___,___,___,___,___,___,___,___),
/*N3*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_NU,___,___,___,___,___,___,___,___,___,___),
/**************************************************************************************************************************************************/
/*C1*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_C2,___),
/*C2*/ PT_(_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C3,_C2),
/*C3*/ PT_(_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_CE,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C2,_C3,_C2),
/*Y1*/ PT_(_Y1,_CE,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1,_Y1),
/*D1*/ PT_(___,___,___,___,___,___,___,___,___,___,_D2,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___),
/*D2*/ PT_(___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,___,_U1,___,___,___,___,___),
};

/* map from (previous state+new character class) to the buffer policy. ignore=0/append=1/escape=2 */
static const uint8_t buffer_policy_table[NR_STATES][NR_CLASSES] = {
/*           white                                                                          ABCDF other     */
/*         sp nl |  {  }  [  ]  :  ,  "  \  /  +  -  .  0  19 a  b  c  d  e  f  l  n  r  s  t  u  |  E  |  *  #  */
/*GO*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*OK*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*OO*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*KK*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*CO*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*VV*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*AA*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/**************************************************************************************************************/
/*SS*/ { 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
/*E0*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 2, 2, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 2, 0, 2, 2, 0, 2, 0, 0, 0, 0, 0, 0 },
/*U1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0 },
/*U2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0 },
/*U3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0 },
/*U4*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0 },
/**************************************************************************************************************/
/*M0*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*Z0*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*I0*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0 },
/*R1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*R2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0 },
/*X1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*X2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*X3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/**************************************************************************************************************/
/*T1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*T2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*T3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*F1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*F2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*F3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*F4*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*N1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*N2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*N3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/**************************************************************************************************************/
/*C1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*C2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*C3*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*Y1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*D1*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
/*D2*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 },
};

/* values stored on the nesting stack */
#define MODE_ARRAY 0
#define MODE_OBJECT 1

/* all parser memory goes through the allocator callbacks found in the config */
#define parser_malloc(parser, s) parser->config.user_malloc(s)
#define parser_realloc(parser, p, s) parser->config.user_realloc(p, s)
#define parser_free(parser, p) parser->config.user_free(p)

/* double the size of the nesting stack.
 * return JSON_ERROR_NESTING_LIMIT when config.max_nesting is set (growing is
 * then refused), JSON_ERROR_NO_MEMORY when the size cannot be doubled or the
 * reallocation fails, 0 otherwise. */
static int state_grow(json_parser *parser)
{
	uint32_t newsize = parser->stack_size * 2;
	void *ptr;

	if (parser->config.max_nesting != 0)
		return JSON_ERROR_NESTING_LIMIT;

	/* the doubling is done on 32 bits: if it wrapped around, refuse to
	 * "grow" to a smaller stack instead of writing past it afterwards */
	if (newsize <= parser->stack_size)
		return JSON_ERROR_NO_MEMORY;

	ptr = parser_realloc(parser, parser->stack, newsize * sizeof(uint8_t));
	if (!ptr)
		return JSON_ERROR_NO_MEMORY;
	parser->stack = (uint8_t *)ptr;
	parser->stack_size = newsize;
	return 0;
}

/* push a mode (MODE_ARRAY/MODE_OBJECT) on the nesting stack, growing it if full.
 * return 0 on success or the error reported by state_grow. */
static int state_push(json_parser *parser, uint8_t mode)
{
	if (parser->stack_offset >= parser->stack_size) {
		int ret = state_grow(parser);
		if (ret)
			return ret;
	}
	parser->stack[parser->stack_offset++] = mode;
	return 0;
}

/* pop the top of the nesting stack and check that it is the expected mode.
 * return JSON_ERROR_POP_EMPTY if the stack is empty,
 * JSON_ERROR_POP_UNEXPECTED_MODE if the popped mode differs, 0 otherwise.
 * note that the entry is popped even when the mode does not match. */
static int state_pop(json_parser *parser, uint8_t mode)
{
	if (parser->stack_offset == 0)
		return JSON_ERROR_POP_EMPTY;
	parser->stack_offset--;
	if (parser->stack[parser->stack_offset] != mode)
		return JSON_ERROR_POP_UNEXPECTED_MODE;
	return 0;
}

/* double the size of the data buffer, never going past config.max_data when
 * that limit is set (non zero).
 * return JSON_ERROR_DATA_LIMIT if the buffer is already at the limit,
 * JSON_ERROR_NO_MEMORY if the size cannot be doubled or the reallocation
 * fails, 0 otherwise. */
static int buffer_grow(json_parser *parser)
{
	uint32_t newsize;
	void *ptr;
	uint32_t max = parser->config.max_data;

	if (max > 0 && parser->buffer_size == max)
		return JSON_ERROR_DATA_LIMIT;

	newsize = parser->buffer_size * 2;
	if (newsize <= parser->buffer_size) {
		/* the 32 bits doubling wrapped around: fall back on the
		 * configured limit if there is one, fail otherwise */
		if (max == 0)
			return JSON_ERROR_NO_MEMORY;
		newsize = max;
	} else if (max > 0 && newsize > max) {
		newsize = max;
	}

	ptr = parser_realloc(parser, parser->buffer, newsize * sizeof(char));
	if (!ptr)
		return JSON_ERROR_NO_MEMORY;
	parser->buffer = (char *)ptr;
	parser->buffer_size = newsize;
	return 0;
}

/* append one character to the data buffer.
 * the test keeps one spare byte after the pushed character, which is where
 * do_callback_withbuf writes its terminating '\0'.
 * return 0 on success or the error reported by buffer_grow. */
static int buffer_push(json_parser *parser, unsigned char c)
{
	int ret;

	if (parser->buffer_offset + 1 >= parser->buffer_size) {
		ret = buffer_grow(parser);
		if (ret)
			return ret;
	}
	parser->buffer[parser->buffer_offset++] = c;
	return 0;
}

/* call the user callback (if any) with the current buffer content, after
 * having nul-terminated it. return the callback return value, 0 without callback. */
static int do_callback_withbuf(json_parser *parser, int type)
{
	if (!parser->callback)
		return 0;
	parser->buffer[parser->buffer_offset] = '\0';
	return (*parser->callback)(parser->userdata, type, parser->buffer, parser->buffer_offset);
}

/* call the user callback (if any) for an event that carries no data.
 * return the callback return value, 0 without callback. */
static int do_callback(json_parser *parser, int type)
{
	if (!parser->callback)
		return 0;
	return (*parser->callback)(parser->userdata, type, NULL, 0);
}

/* report the pending value (the type recorded by the last action) to the user
 * callback, then empty the buffer. other types only get the buffer emptied.
 * if the callback returns non zero, that value is returned and the buffer is
 * left untouched. */
static int do_buffer(json_parser *parser)
{
	int ret = 0;

	switch (parser->type) {
	case JSON_KEY: case JSON_STRING:
	case JSON_FLOAT: case JSON_INT:
	case JSON_NULL: case JSON_TRUE: case JSON_FALSE:
		ret = do_callback_withbuf(parser, parser->type);
		if (ret)
			return ret;
		break;
	default:
		break;
	}
	parser->buffer_offset = 0;
	return ret;
}

/* value of an hexadecimal digit for characters < 128, 255 for everything else.
 * the table has 128 entries only: it must be indexed with characters < 128. */
static const uint8_t hextable[] = {
	255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,
	255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,
	255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,
	  0,  1,  2,  3,  4,  5,  6,  7,  8,  9,255,255,255,255,255,255,
	255, 10, 11, 12, 13, 14, 15,255,255,255,255,255,255,255,255,255,
	255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,
	255, 10, 11, 12, 13, 14, 15,255,255,255,255,255,255,255,255,255,
	255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,
};

#define hex(c) (hextable[(uint8_t) (c)])

/* high surrogate range from d800 to dbff */
/* low surrogate range dc00 to dfff */
#define IS_HIGH_SURROGATE(uc) (((uc) & 0xfc00) == 0xd800)
#define IS_LOW_SURROGATE(uc)  (((uc) & 0xfc00) == 0xdc00)

/* transform an unicode [0-9A-Fa-f]{4} sequence into a proper value
 *
 * the 4 hexadecimal digits are the last 4 characters of the buffer; they are
 * replaced in place by the UTF-8 encoding of the code point (at most 4 bytes,
 * so no buffer growth is needed).
 * a high surrogate writes nothing and is remembered in parser->unicode_multi
 * until the next sequence, which then has to be a low surrogate.
 * return 0, JSON_ERROR_UNICODE_MISSING_LOW_SURROGATE or
 * JSON_ERROR_UNICODE_UNEXPECTED_LOW_SURROGATE. */
static int decode_unicode_char(json_parser *parser)
{
	uint32_t uval;
	char *b = parser->buffer;
	uint32_t offset = parser->buffer_offset;

	uval = (hex(b[offset - 4]) << 12) | (hex(b[offset - 3]) << 8)
	     | (hex(b[offset - 2]) << 4) | hex(b[offset - 1]);

	/* drop the 4 digits, the encoded character is written over them */
	parser->buffer_offset -= 4;

	/* fast case */
	if (!parser->unicode_multi && uval < 0x80) {
		b[parser->buffer_offset++] = (char) uval;
		return 0;
	}

	if (parser->unicode_multi) {
		/* second half of a surrogate pair: 4 bytes UTF-8 sequence */
		if (!IS_LOW_SURROGATE(uval))
			return JSON_ERROR_UNICODE_MISSING_LOW_SURROGATE;

		uval = 0x10000 + ((parser->unicode_multi & 0x3ff) << 10) + (uval & 0x3ff);
		b[parser->buffer_offset++] = (char) ((uval >> 18) | 0xf0);
		b[parser->buffer_offset++] = (char) (((uval >> 12) & 0x3f) | 0x80);
		b[parser->buffer_offset++] = (char) (((uval >> 6) & 0x3f) | 0x80);
		b[parser->buffer_offset++] = (char) ((uval & 0x3f) | 0x80);
		parser->unicode_multi = 0;
		return 0;
	}

	if (IS_LOW_SURROGATE(uval))
		return JSON_ERROR_UNICODE_UNEXPECTED_LOW_SURROGATE;
	if (IS_HIGH_SURROGATE(uval)) {
		parser->unicode_multi = (uint16_t)uval;
		return 0;
	}

	if (uval < 0x800) {
		/* 2 bytes UTF-8 sequence */
		b[parser->buffer_offset++] = (char) ((uval >> 6) | 0xc0);
		b[parser->buffer_offset++] = (char) ((uval & 0x3f) | 0x80);
	} else {
		/* 3 bytes UTF-8 sequence */
		b[parser->buffer_offset++] = (char) ((uval >> 12) | 0xe0);
		b[parser->buffer_offset++] = (char) (((uval >> 6) & 0x3f) | 0x80);
		b[parser->buffer_offset++] = (char) (((uval >> 0) & 0x3f) | 0x80);
	}
	return 0;
}

/* push in the buffer the character designated by the escape letter `next`
 * (the character following a backslash). any letter not listed below pushes
 * a '\0'. return the buffer_push return value. */
static int buffer_push_escape(json_parser *parser, unsigned char next)
{
	char c = '\0';

	switch (next) {
	case 'b': c = '\b'; break;
	case 'f': c = '\f'; break;
	case 'n': c = '\n'; break;
	case 'r': c = '\r'; break;
	case 't': c = '\t'; break;
	case '"': c = '"'; break;
	case '/': c = '/'; break;
	case '\\': c = '\\'; break;
	default: break;
	}
	/* push the escaped character */
	return buffer_push(parser, c);
}

/* run f and return its value from the enclosing function if it is not 0.
 * needs an `int ret` in scope. */
#define CHK(f) { ret = f; if (ret) return ret; }

/* UC: a \uXXXX sequence is complete. decode it, then either wait for the
 * second half of a surrogate pair (D1) or go back to the string state. */
static int act_uc(json_parser *parser)
{
	int ret;
	CHK(decode_unicode_char(parser));
	parser->state = (uint8_t)((parser->unicode_multi) ? STATE_D1 : STATE_SS);
	return 0;
}

/* YB: start of a YAML comment. refused unless enabled in the config;
 * the current state is saved for act_ce. */
static int act_yb(json_parser *parser)
{
	if (!parser->config.allow_yaml_comments)
		return JSON_ERROR_COMMENT_NOT_ALLOWED;
	parser->save_state = parser->state;
	return 0;
}

/* CB: start of a C comment. refused unless enabled in the config;
 * the current state is saved for act_ce. */
static int act_cb(json_parser *parser)
{
	if (!parser->config.allow_c_comments)
		return JSON_ERROR_COMMENT_NOT_ALLOWED;
	parser->save_state = parser->state;
	return 0;
}

/* CE: end of a comment. go back to the state saved when the comment started,
 * or to OK if that state was past STATE_AA (i.e. not one of GO..AA). */
static int act_ce(json_parser *parser)
{
	parser->state = (parser->save_state > STATE_AA) ? (uint8_t)(STATE_OK) : (uint8_t)(parser->save_state);
	return 0;
}

/* OB: object begin. notify the user, push the object mode and expect a key. */
static int act_ob(json_parser *parser)
{
	int ret;
	CHK(do_callback(parser, JSON_OBJECT_BEGIN));
	CHK(state_push(parser, MODE_OBJECT));
	parser->expecting_key = 1;
	return 0;
}

/* OE: object end. pop the object mode and notify the user. */
static int act_oe(json_parser *parser)
{
	int ret;
	CHK(state_pop(parser, MODE_OBJECT));
	CHK(do_callback(parser, JSON_OBJECT_END));
	parser->expecting_key = 0;
	return 0;
}

/* AB: array begin. notify the user and push the array mode. */
static int act_ab(json_parser *parser)
{
	int ret;
	CHK(do_callback(parser, JSON_ARRAY_BEGIN));
	CHK(state_push(parser, MODE_ARRAY));
	return 0;
}

/* AE: array end. pop the array mode and notify the user. */
static int act_ae(json_parser *parser)
{
	int ret;
	CHK(state_pop(parser, MODE_ARRAY));
	CHK(do_callback(parser, JSON_ARRAY_END));
	return 0;
}

/* SE: string end. report the buffer as a key or as a string depending on
 * expecting_key, empty the buffer, then wait for a colon (after a key) or go
 * to OK (after a string value). */
static int act_se(json_parser *parser)
{
	int ret;
	CHK(do_callback_withbuf(parser, (parser->expecting_key) ? JSON_KEY : JSON_STRING));
	parser->buffer_offset = 0;
	parser->state = (uint8_t)((parser->expecting_key) ? STATE_CO : STATE_OK);
	parser->expecting_key = 0;
	return 0;
}

/* SP: comma. only valid inside a structure; the top of the nesting stack
 * tells whether a key (object) or a value (array) has to follow. */
static int act_sp(json_parser *parser)
{
	if (parser->stack_offset == 0)
		return JSON_ERROR_COMMA_OUT_OF_STRUCTURE;
	if (parser->stack[parser->stack_offset - 1] == MODE_OBJECT) {
		parser->expecting_key = 1;
		parser->state = STATE_KK;
	} else
		parser->state = STATE_VV;
	return 0;
}

/* description of what do_action does for one action */
struct action_descr
{
	int (*call)(json_parser *parser); /* optional handler */
	json_type type; /* type recorded in the parser after the action */
	uint8_t state; /* 0 if we let the callback set the value it wants */
	uint8_t dobuffer; /* call do_buffer before the handler (ignored without handler) */
};

/* indexed by the action value with its 0x80 bit cleared: the order has to
 * follow enum actions */
static const struct action_descr actions_map[] = {
	{ NULL,   JSON_NONE,  STATE_VV, 0 }, /* KS */
	{ act_sp, JSON_NONE,  0,        1 }, /* SP */
	{ act_ab, JSON_NONE,  STATE_AA, 0 }, /* AB */
	{ act_ae, JSON_NONE,  STATE_OK, 1 }, /* AE */
	{ act_ob, JSON_NONE,  STATE_OO, 0 }, /* OB */
	{ act_oe, JSON_NONE,  STATE_OK, 1 }, /* OE */
	{ act_cb, JSON_NONE,  STATE_C1, 1 }, /* CB */
	{ act_yb, JSON_NONE,  STATE_Y1, 1 }, /* YB */
	{ act_ce, JSON_NONE,  0,        0 }, /* CE */
	{ NULL,   JSON_FALSE, STATE_OK, 0 }, /* FA */
	{ NULL,   JSON_TRUE,  STATE_OK, 0 }, /* TR */
	{ NULL,   JSON_NULL,  STATE_OK, 0 }, /* NU */
	{ NULL,   JSON_FLOAT, STATE_X1, 0 }, /* DE */
	{ NULL,   JSON_FLOAT, STATE_R1, 0 }, /* DF */
	{ act_se, JSON_NONE,  0,        0 }, /* SE */
	{ NULL,   JSON_INT,   STATE_M0, 0 }, /* MX */
	{ NULL,   JSON_INT,   STATE_Z0, 0 }, /* ZX */
	{ NULL,   JSON_INT,   STATE_I0, 0 }, /* IX */
	{ act_uc, JSON_NONE,  0,        0 }, /* UC */
};

/* execute the action `next_state` (a value of enum actions): flush the pending
 * value if requested, run the handler, then apply the state and the type of
 * the action description. return 0 or the first error met. */
static int do_action(json_parser *parser, uint8_t next_state)
{
	const struct action_descr *descr = &actions_map[next_state & ~0x80];

	if (descr->call) {
		int ret;
		if (descr->dobuffer)
			CHK(do_buffer(parser));
		CHK((descr->call)(parser));
	}
	/* a 0 state means that the handler already chose the next state */
	if (descr->state)
		parser->state = descr->state;
	parser->type = descr->type;
	return 0;
}

/** json_parser_init initialize a parser structure taking a config,
 * a callback and its userdata.
 * return JSON_ERROR_NO_MEMORY if memory allocation failed or 0 on success.
 *
 * the stack and the buffer are allocated through config.user_malloc: the
 * config is expected to provide the allocator callbacks (with a NULL config
 * they are left zeroed by the memset below).
 * on failure nothing is left allocated and the parser pointers are NULL. */
int json_parser_init(json_parser *parser, json_config *config,
                     json_parser_callback callback, void *userdata)
{
	memset(parser, 0, sizeof(*parser));

	if (config)
		memcpy(&parser->config, config, sizeof(json_config));
	parser->callback = callback;
	parser->userdata = userdata;

	/* initialise parsing stack and state */
	parser->stack_offset = 0;
	parser->state = STATE_GO;

	/* initialize the parse stack */
	parser->stack_size = (parser->config.max_nesting > 0)
		? parser->config.max_nesting
		: LIBJSON_DEFAULT_STACK_SIZE;

	parser->stack = (uint8_t *)parser_malloc(parser, parser->stack_size * sizeof(parser->stack[0]));
	if (!parser->stack)
		return JSON_ERROR_NO_MEMORY;

	/* initialize the parse buffer */
	parser->buffer_size = (parser->config.buffer_initial_size > 0)
		? parser->config.buffer_initial_size
		: LIBJSON_DEFAULT_BUFFER_SIZE;

	if (parser->config.max_data > 0 && parser->buffer_size > parser->config.max_data)
		parser->buffer_size = parser->config.max_data;

	parser->buffer = (char *)parser_malloc(parser, parser->buffer_size * sizeof(char));
	if (!parser->buffer) {
		parser_free(parser, parser->stack);
		/* do not leave a dangling pointer that json_parser_free would free again */
		parser->stack = NULL;
		return JSON_ERROR_NO_MEMORY;
	}
	return 0;
}

/** json_parser_free free the memory allocated by the parser.
 * a NULL parser is accepted. always return 0. */
int json_parser_free(json_parser *parser)
{
	if (!parser)
		return 0;
	parser_free(parser, parser->stack);
	parser_free(parser, parser->buffer);
	parser->stack = NULL;
	parser->buffer = NULL;
	return 0;
}

/** json_parser_is_done return 0 if the parser isn't in a finished state. !0 if it is */
int json_parser_is_done(json_parser *parser)
{
	/* need to compare the state to !GO to not accept empty document */
	return parser->stack_offset == 0 && parser->state != STATE_GO;
}

/** json_parser_string append a string s with a specific length to the parser
 * return 0 if everything went ok, a JSON_ERROR_* otherwise.
 * the user can supply a valid processed pointer that will
 * be filled with the number of processed characters before returning
 * (on error, this is the index of the character that was rejected) */
int json_parser_string(json_parser *parser, const char *s,
                       uint32_t length, uint32_t *processed)
{
	int ret;
	uint8_t next_class, next_state;
	uint32_t buffer_policy;
	uint32_t i;

	ret = 0;
	for (i = 0; i < length; i++) {
		unsigned char ch = s[i];

		ret = 0;
		/* the class table covers characters < 128 only */
		next_class = (ch >= 128) ? (uint8_t)(C_OTHER) : (uint8_t)(character_class[ch]);
		if (next_class == C_ERROR) {
			ret = JSON_ERROR_BAD_CHAR;
			break;
		}

		next_state = state_transition_table[parser->state][next_class];
		buffer_policy = buffer_policy_table[parser->state][next_class];
		if (next_state == STATE___) {
			ret = JSON_ERROR_UNEXPECTED_CHAR;
			break;
		}

		/* add char to buffer */
		if (buffer_policy) {
			ret = (buffer_policy == 2)
				? buffer_push_escape(parser, ch)
				: buffer_push(parser, ch);
			if (ret)
				break;
		}

		/* move to the next level */
		if (IS_STATE_ACTION(next_state))
			ret = do_action(parser, next_state);
		else
			parser->state = next_state;
		if (ret)
			break;
	}
	if (processed)
		*processed = i;
	return ret;
}

/** json_parser_char append one single char to the parser
 * return 0 if everything went ok, a JSON_ERROR_* otherwise */
int json_parser_char(json_parser *parser, unsigned char ch)
{
	return json_parser_string(parser, (char *) &ch, 1, NULL);
}