lws-api-doc-main/html/lws-tokenize_8h_source.html

/*

 * libwebsockets - small server side websockets and web server implementation

 *

 * Copyright (C) 2010 - 2019 Andy Green <andy@warmcat.com>

 *

 * Permission is hereby granted, free of charge, to any person obtaining a copy

 * of this software and associated documentation files (the "Software"), to

 * deal in the Software without restriction, including without limitation the

 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

 * sell copies of the Software, and to permit persons to whom the Software is

 * furnished to do so, subject to the following conditions:

 *

 * The above copyright notice and this permission notice shall be included in

 * all copies or substantial portions of the Software.

 *

 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS

 * IN THE SOFTWARE.

 */


/*
 * Tokenizer option bits (LWS_TOKENIZE_F_*).  Each option is a distinct single
 * bit, so options can be OR-ed together.
 */

/* '-' is not a terminal character: "my-token" is one token */
#define LWS_TOKENIZE_F_MINUS_NONTERM	(1 << 0)
/* Separately report aggregate colon-delimited tokens */
#define LWS_TOKENIZE_F_AGG_COLON	(1 << 1)
/* Enforce sequencing for a simple "token , token , token ..." list */
#define LWS_TOKENIZE_F_COMMA_SEP_LIST	(1 << 2)
/*
 * Allow more characters in tokens and fewer delimiters; without this flag the
 * default is only alphanumeric + underscore in tokens
 */
#define LWS_TOKENIZE_F_RFC7230_DELIMS	(1 << 3)
/* '.' is not a terminal character: "warmcat.com" is one token */
#define LWS_TOKENIZE_F_DOT_NONTERM	(1 << 4)
/*
 * Anything that starts to look like a float, like 1.2, is forced to be a
 * string token.  Dotted-quads like 192.168.0.1 are then received as string
 * tokens, and illegal float format detection on input like 1.myserver.com
 * is avoided.
 */
#define LWS_TOKENIZE_F_NO_FLOATS	(1 << 5)
/* Report integers as any other string token instead of LWS_TOKZE_INTEGER */
#define LWS_TOKENIZE_F_NO_INTEGERS	(1 << 6)
/* '#' makes the rest of the line a comment */
#define LWS_TOKENIZE_F_HASH_COMMENT	(1 << 7)
/* '/' is not a terminal character: "multipart/related" is one token */
#define LWS_TOKENIZE_F_SLASH_NONTERM	(1 << 8)
/* '*' is not a terminal character: "myfile*" is one token */
#define LWS_TOKENIZE_F_ASTERISK_NONTERM	(1 << 9)
/* '=' is not a terminal character: "x=y" is one token */
#define LWS_TOKENIZE_F_EQUALS_NONTERM	(1 << 10)
/* ':' is not a terminal character: ::1 is one token */
#define LWS_TOKENIZE_F_COLON_NONTERM	(1 << 11)

/* Only a chunk is being tokenized: running out of input is not final */
#define LWS_TOKENIZE_F_EXPECT_MORE	(1 << 12)


/*
 * Element / status codes of the tokenizer (the return type of lws_tokenize()).
 *
 * Sign convention: values > 0 are results, 0 is end of content and values
 * < 0 are errors.
 */
typedef enum {
	/*
	 * The number of error codes defined below.  Note this has the same
	 * value (7) as LWS_TOKZE_QUOTED_STRING, so the two names are not
	 * distinguishable by value and cannot both be case labels in one
	 * switch.
	 */
	LWS_TOKZE_ERRS			=  7,

	/* --- errors: always negative --- */
	LWS_TOKZE_TOO_LONG		= -7,	/* token too long */
	LWS_TOKZE_WANT_READ		= -6,	/* need more input */
	LWS_TOKZE_ERR_BROKEN_UTF8	= -5,	/* malformed or partial utf8 */
	LWS_TOKZE_ERR_UNTERM_STRING	= -4,	/* ended while we were in "" */
	LWS_TOKZE_ERR_MALFORMED_FLOAT	= -3,	/* like 0..1 or 0.1.1 */
	LWS_TOKZE_ERR_NUM_ON_LHS	= -2,	/* like 123= or 0.1= */
	LWS_TOKZE_ERR_COMMA_LIST	= -1,	/* like ",tok", or, "tok,," */

	/* --- end of content --- */
	LWS_TOKZE_ENDED			=  0,	/* no more content */

	/* --- results: ordinals 1 and up --- */
	LWS_TOKZE_DELIMITER		=  1,	/* a delimiter appeared */
	LWS_TOKZE_TOKEN			=  2,	/* a token appeared */
	LWS_TOKZE_INTEGER		=  3,	/* an integer appeared */
	LWS_TOKZE_FLOAT			=  4,	/* a float appeared */
	LWS_TOKZE_TOKEN_NAME_EQUALS	=  5,	/* token [whitespace] = */
	LWS_TOKZE_TOKEN_NAME_COLON	=  6,	/* token [whitespace] : (only
						 * with the
						 * LWS_TOKENIZE_F_AGG_COLON
						 * flag) */
	LWS_TOKZE_QUOTED_STRING		=  7	/* "*", where * may have any char */
} lws_tokenize_elem;


/*
 * Helper states a caller can use to enforce legal delimiter sequencing
 * itself, for example to reject "token,,token", "token," and ",token".
 */
enum lws_tokenize_delimiter_tracking {
	LWSTZ_DT_NEED_FIRST_CONTENT	= 0,
	LWSTZ_DT_NEED_DELIM		= 1,
	LWSTZ_DT_NEED_NEXT_CONTENT	= 2,
};


/*
 * Parser state type; it is the type of the "state" member of
 * struct lws_tokenize.
 *
 * NOTE(review): the exact meaning of each state is defined by the
 * implementation, which is not part of this header.
 */
typedef enum {
	LWS_TOKZS_LEADING_WHITESPACE	= 0,
	LWS_TOKZS_QUOTED_STRING		= 1,
	LWS_TOKZS_TOKEN			= 2,
	LWS_TOKZS_TOKEN_POST_TERMINAL	= 3
} lws_tokenize_state;


/*
 * Tokenizer context: the object handed to lws_tokenize_init(), lws_tokenize()
 * and lws_tokenize_cstr().
 *
 * NOTE(review): member notes marked "presumably" are inferred from the member
 * names only; confirm them against the implementation.
 */
typedef struct lws_tokenize {
	char			collect[256];	/* token length limit */
	const char		*start;		/* presumably the input text */
	const char		*token;		/* presumably the current token */
	size_t			len;		/* presumably the input length */
	size_t			token_len;	/* presumably length of *token */

	lws_tokenize_state	state;		/* parser state */

	int			line;
	int			effline;

	/* the LWS_TOKENIZE_F_* options occupy bits 0..12, so they fit here */
	uint16_t		flags;
	uint8_t			delim;

	int8_t			e;
	/* three one-bit flags */
	uint8_t			reset_token:1;
	uint8_t			crlf:1;
	uint8_t			dry:1;
} lws_tokenize_t;


/*
 * lws_tokenize_init() - set up a tokenizer context
 *
 * ts:    the context to initialise
 * start: NOTE(review): presumably the beginning of the text to tokenize
 * flags: NOTE(review): presumably an OR of LWS_TOKENIZE_F_* option bits; note
 *        the parameter is int while the flags member of struct lws_tokenize
 *        is uint16_t
 */
LWS_VISIBLE LWS_EXTERN void

lws_tokenize_init(struct lws_tokenize *ts, const char *start, int flags);


/*
 * lws_tokenize() - run the tokenizer on context ts
 *
 * Returns an lws_tokenize_elem.  As noted in that enum, results have ordinal
 * 1 and up, LWS_TOKZE_ENDED (0) means no more content, and errors are
 * negative.
 */
LWS_VISIBLE LWS_EXTERN lws_tokenize_elem

lws_tokenize(struct lws_tokenize *ts);


/*
 * lws_tokenize_cstr() - NOTE(review): presumably copies the current token of
 * ts into str as a NUL-terminated C string, with max being the size of str.
 *
 * The meaning of the int return value is not visible in this header; confirm
 * it against the implementation before relying on it.
 */
LWS_VISIBLE LWS_EXTERN int

lws_tokenize_cstr(struct lws_tokenize *ts, char *str, size_t max);


/*

 * lws_strexp: flexible string expansion helper api

 *

 * This stateful helper can handle multiple separate input chunks and multiple

 * output buffer loads with arbitrary boundaries between literals and expanded

 * symbols.  This allows it to handle fragmented input as well as arbitrarily

 * long symbol expansions that are bigger than the output buffer itself.

 *

 * A user callback is used to convert symbol names to the symbol value.

 *

 * As a result, a one-byte input buffer and a one-byte output buffer are

 * enough to process a substitution of any length.  The state object is around

 * 88 bytes on a 64-bit system and it only uses 8 bytes of stack.

 */


/*
 * User callback type that converts a symbol name to the symbol value.
 *
 * priv:    opaque user pointer
 * name:    the symbol name to look up
 * out:     output buffer
 * pos:     NOTE(review): presumably the current write offset in out, updated
 *          by the callback
 * olen:    NOTE(review): presumably the size of out
 * exp_ofs: NOTE(review): presumably how much of the expansion has already
 *          been emitted, so that a long value can span several output buffers
 *
 * NOTE(review): the return value is presumably one of the LSTRX_ codes;
 * confirm against the implementation.
 */
typedef int (*lws_strexp_expand_cb)(void *priv, const char *name, char *out,

                                    size_t *pos, size_t olen, size_t *exp_ofs);


/*
 * State object for the lws_strexp string expansion helper; the lws_strexp_*()
 * functions all take a pointer to it.
 *
 * NOTE(review): member notes marked "presumably" are inferred from the member
 * names and the lws_strexp_init() parameter names; confirm them against the
 * implementation.
 */
typedef struct lws_strexp {
	char			name[32];	/* symbol name buffer */
	lws_strexp_expand_cb	cb;		/* name -> value callback */
	void			*priv;		/* opaque pointer for cb */
	char			*out;		/* output buffer */
	size_t			olen;		/* presumably size of out */
	size_t			pos;		/* presumably offset in out */

	size_t			exp_ofs;

	uint8_t			name_pos;	/* presumably fill of name[] */
	char			state;
} lws_strexp_t;


/*
 * lws_strexp status codes: non-negative values are not fatal, negative values
 * are fatal.
 */
enum {
	LSTRX_DONE			=  0,	/* it completed OK */
	LSTRX_FILLED_OUT		=  1,	/* out buf filled and needs
						 * resetting */
	LSTRX_FATAL_NAME_TOO_LONG	= -1,	/* fatal */
	LSTRX_FATAL_NAME_UNKNOWN	= -2,	/* fatal */
};


/*
 * lws_strexp_init() - set up a string expansion state object
 *
 * exp:  the state object to initialise
 * priv: opaque user pointer (the callback type takes a priv argument)
 * cb:   callback that converts a symbol name to its value
 * out:  output buffer
 * olen: NOTE(review): presumably the size of out in bytes
 */
LWS_VISIBLE LWS_EXTERN void

lws_strexp_init(lws_strexp_t *exp, void *priv, lws_strexp_expand_cb cb,

                char *out, size_t olen);


/*
 * lws_strexp_reset_out() - give the expansion state a new output buffer
 *
 * NOTE(review): presumably this is what the caller uses after seeing
 * LSTRX_FILLED_OUT ("out buf filled and needs resetting"); confirm.
 *
 * exp:  the state object
 * out:  output buffer
 * olen: NOTE(review): presumably the size of out in bytes
 */
LWS_VISIBLE LWS_EXTERN void

lws_strexp_reset_out(lws_strexp_t *exp, char *out, size_t olen);


/*
 * lws_strexp_expand() - process one chunk of input through the expander
 *
 * exp:       the state object
 * in:        input chunk
 * len:       NOTE(review): presumably the length of in, in bytes
 * pused_in:  NOTE(review): presumably set to the amount of input consumed
 * pused_out: NOTE(review): presumably set to the amount of output produced
 *
 * NOTE(review): the int return is presumably one of the LSTRX_ codes
 * (LSTRX_DONE, LSTRX_FILLED_OUT or a negative LSTRX_FATAL_ value); confirm.
 */
LWS_VISIBLE LWS_EXTERN int

lws_strexp_expand(lws_strexp_t *exp, const char *in, size_t len,

                  size_t *pused_in, size_t *pused_out);


/*
 * lws_strcmp_wildcard() - compare a string against a wildcard pattern
 *
 * Both strings are passed with explicit lengths.
 *
 * wildcard: the pattern
 * wlen:     length of wildcard
 * check:    the string to test against the pattern
 * clen:     length of check
 *
 * NOTE(review): the wildcard syntax and the return convention (presumably
 * strcmp-like, 0 on match) are not visible in this header; confirm against
 * the implementation.
 */
LWS_VISIBLE LWS_EXTERN int

lws_strcmp_wildcard(const char *wildcard, size_t wlen, const char *check,

                    size_t clen);

uint16_t
unsigned short uint16_t
Definition libwebsockets.h:581

LWS_EXTERN
#define LWS_EXTERN
Definition libwebsockets.h:235

uint8_t
unsigned char uint8_t
Definition libwebsockets.h:582

LWS_VISIBLE
#define LWS_VISIBLE
Definition libwebsockets.h:230

lws_tokenize_delimiter_tracking
lws_tokenize_delimiter_tracking
Definition lws-tokenize.h:88

LWSTZ_DT_NEED_NEXT_CONTENT
@ LWSTZ_DT_NEED_NEXT_CONTENT
Definition lws-tokenize.h:91

LWSTZ_DT_NEED_DELIM
@ LWSTZ_DT_NEED_DELIM
Definition lws-tokenize.h:90

LWSTZ_DT_NEED_FIRST_CONTENT
@ LWSTZ_DT_NEED_FIRST_CONTENT
Definition lws-tokenize.h:89

lws_tokenize::state
lws_tokenize_state state
Definition lws-tokenize.h:108

lws_strexp_init
LWS_VISIBLE LWS_EXTERN void lws_strexp_init(lws_strexp_t *exp, void *priv, lws_strexp_expand_cb cb, char *out, size_t olen)

lws_tokenize::dry
uint8_t dry
Definition lws-tokenize.h:119

lws_strexp::name
char name[32]
Definition lws-tokenize.h:195

lws_tokenize::reset_token
uint8_t reset_token
Definition lws-tokenize.h:117

lws_tokenize::token
const char * token
Definition lws-tokenize.h:104

lws_tokenize::len
size_t len
Definition lws-tokenize.h:105

lws_tokenize_t
struct lws_tokenize lws_tokenize_t

lws_strexp_expand_cb
int(* lws_strexp_expand_cb)(void *priv, const char *name, char *out, size_t *pos, size_t olen, size_t *exp_ofs)
Definition lws-tokenize.h:191

lws_tokenize::token_len
size_t token_len
Definition lws-tokenize.h:106

lws_strexp_reset_out
LWS_VISIBLE LWS_EXTERN void lws_strexp_reset_out(lws_strexp_t *exp, char *out, size_t olen)

lws_strexp::cb
lws_strexp_expand_cb cb
Definition lws-tokenize.h:196

lws_tokenize
LWS_VISIBLE LWS_EXTERN lws_tokenize_elem lws_tokenize(struct lws_tokenize *ts)

lws_strexp::out
char * out
Definition lws-tokenize.h:198

lws_tokenize::line
int line
Definition lws-tokenize.h:110

lws_strexp::state
char state
Definition lws-tokenize.h:205

lws_tokenize::e
int8_t e
Definition lws-tokenize.h:116

lws_strexp::priv
void * priv
Definition lws-tokenize.h:197

lws_strexp::pos
size_t pos
Definition lws-tokenize.h:200

lws_strexp_expand
LWS_VISIBLE LWS_EXTERN int lws_strexp_expand(lws_strexp_t *exp, const char *in, size_t len, size_t *pused_in, size_t *pused_out)

lws_tokenize::crlf
uint8_t crlf
Definition lws-tokenize.h:118

LSTRX_DONE
@ LSTRX_DONE
Definition lws-tokenize.h:209

LSTRX_FATAL_NAME_TOO_LONG
@ LSTRX_FATAL_NAME_TOO_LONG
Definition lws-tokenize.h:211

LSTRX_FATAL_NAME_UNKNOWN
@ LSTRX_FATAL_NAME_UNKNOWN
Definition lws-tokenize.h:212

LSTRX_FILLED_OUT
@ LSTRX_FILLED_OUT
Definition lws-tokenize.h:210

lws_tokenize_init
LWS_VISIBLE LWS_EXTERN void lws_tokenize_init(struct lws_tokenize *ts, const char *start, int flags)

lws_tokenize_state
lws_tokenize_state
Definition lws-tokenize.h:94

LWS_TOKZS_TOKEN
@ LWS_TOKZS_TOKEN
Definition lws-tokenize.h:97

LWS_TOKZS_TOKEN_POST_TERMINAL
@ LWS_TOKZS_TOKEN_POST_TERMINAL
Definition lws-tokenize.h:98

LWS_TOKZS_QUOTED_STRING
@ LWS_TOKZS_QUOTED_STRING
Definition lws-tokenize.h:96

LWS_TOKZS_LEADING_WHITESPACE
@ LWS_TOKZS_LEADING_WHITESPACE
Definition lws-tokenize.h:95

lws_tokenize_elem
lws_tokenize_elem
Definition lws-tokenize.h:56

LWS_TOKZE_ERR_NUM_ON_LHS
@ LWS_TOKZE_ERR_NUM_ON_LHS
Definition lws-tokenize.h:65

LWS_TOKZE_WANT_READ
@ LWS_TOKZE_WANT_READ
Definition lws-tokenize.h:61

LWS_TOKZE_TOKEN
@ LWS_TOKZE_TOKEN
Definition lws-tokenize.h:73

LWS_TOKZE_QUOTED_STRING
@ LWS_TOKZE_QUOTED_STRING
Definition lws-tokenize.h:79

LWS_TOKZE_ERR_MALFORMED_FLOAT
@ LWS_TOKZE_ERR_MALFORMED_FLOAT
Definition lws-tokenize.h:64

LWS_TOKZE_DELIMITER
@ LWS_TOKZE_DELIMITER
Definition lws-tokenize.h:72

LWS_TOKZE_TOKEN_NAME_EQUALS
@ LWS_TOKZE_TOKEN_NAME_EQUALS
Definition lws-tokenize.h:76

LWS_TOKZE_TOO_LONG
@ LWS_TOKZE_TOO_LONG
Definition lws-tokenize.h:60

LWS_TOKZE_FLOAT
@ LWS_TOKZE_FLOAT
Definition lws-tokenize.h:75

LWS_TOKZE_ERR_BROKEN_UTF8
@ LWS_TOKZE_ERR_BROKEN_UTF8
Definition lws-tokenize.h:62

LWS_TOKZE_ERRS
@ LWS_TOKZE_ERRS
Definition lws-tokenize.h:58

LWS_TOKZE_INTEGER
@ LWS_TOKZE_INTEGER
Definition lws-tokenize.h:74

LWS_TOKZE_ENDED
@ LWS_TOKZE_ENDED
Definition lws-tokenize.h:68

LWS_TOKZE_TOKEN_NAME_COLON
@ LWS_TOKZE_TOKEN_NAME_COLON
Definition lws-tokenize.h:77

LWS_TOKZE_ERR_UNTERM_STRING
@ LWS_TOKZE_ERR_UNTERM_STRING
Definition lws-tokenize.h:63

LWS_TOKZE_ERR_COMMA_LIST
@ LWS_TOKZE_ERR_COMMA_LIST
Definition lws-tokenize.h:66

lws_tokenize::flags
uint16_t flags
Definition lws-tokenize.h:113

lws_tokenize::delim
uint8_t delim
Definition lws-tokenize.h:114

lws_strexp::name_pos
uint8_t name_pos
Definition lws-tokenize.h:204

lws_tokenize::collect
char collect[256]
Definition lws-tokenize.h:102

lws_tokenize::start
const char * start
Definition lws-tokenize.h:103

lws_tokenize::effline
int effline
Definition lws-tokenize.h:111

lws_strexp::exp_ofs
size_t exp_ofs
Definition lws-tokenize.h:202

lws_tokenize_cstr
LWS_VISIBLE LWS_EXTERN int lws_tokenize_cstr(struct lws_tokenize *ts, char *str, size_t max)

lws_strexp_t
struct lws_strexp lws_strexp_t

lws_strcmp_wildcard
LWS_VISIBLE LWS_EXTERN int lws_strcmp_wildcard(const char *wildcard, size_t wlen, const char *check, size_t clen)

lws_strexp::olen
size_t olen
Definition lws-tokenize.h:199

lws_strexp
Definition lws-tokenize.h:194

lws_tokenize
Definition lws-tokenize.h:101