src/lib/url.c
author Tero Marttila <terom@fixme.fi>
Wed, 08 Oct 2008 22:05:13 +0300
changeset 15 a8d183e79ed9
parent 14 115067dfba55
child 16 74fb62022fb3
permissions -rw-r--r--
look ma, it compiles\!
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     1
#define _GNU_SOURCE
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     2
#include <stdlib.h>
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     3
#include <string.h>
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     4
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     5
#include "url.h"
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     6
#include "lex.h"
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     7
#include "error.h"
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
     8
#include "misc.h"
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
     9
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
    10
/*
 * Token/state identifiers for the URL lexer.
 *
 * The numeric values follow declaration order starting at zero; URL_MAX is the
 * number of identifiers and is used as the lexer's state count.
 */
enum url_token {
    URL_INVALID,

    URL_BEGIN,

    // kludge to resolve ambiguous URL_SCHEME/URL_USERNAME+URL_PASSWORD/URL_HOSTNAME+URL_SERVICE at the beginning
    URL_BEGIN_ALNUM,
    URL_BEGIN_COLON,

    // scheme and its "://" terminator
    URL_SCHEME,
    URL_SCHEME_SEP,
    URL_SCHEME_END_COL,
    URL_SCHEME_END_SLASH1,
    URL_SCHEME_END_SLASH2,

    // kludge to resolve ambiguous URL_USERNAME+URL_PASSWORD/URL_HOSTNAME+URL_SERVICE after a scheme
    URL_USERHOST_ALNUM,
    URL_USERHOST_COLON,
    URL_USERHOST_ALNUM2,

    // username[:password] part
    URL_USERNAME,
    URL_PASSWORD_SEP,
    URL_PASSWORD,
    URL_USERNAME_END,

    // hostname[:service] part
    URL_HOSTNAME,

    URL_SERVICE_SEP,
    URL_SERVICE,

    // path part
    URL_PATH_START,
    URL_PATH,

    // key[=value] options
    URL_OPT_START,
    URL_OPT_KEY,
    URL_OPT_EQ,
    URL_OPT_VAL,
    URL_OPT_SEP,

    // number of identifiers above; must stay last
    URL_MAX,
};
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    51
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
    52
/*
 * Parser state
 *
 * Passed to the lexer token callback as its opaque argument.
 */
struct url_state {
    // the URL to parse into
    struct url *url;

    // our lookahead-kludge: an alnum token whose meaning (scheme/username/hostname) is not yet known is stashed in
    // `alnum` until a later token disambiguates it
    // NOTE(review): `alnum2` is not referenced by the visible code - confirm whether it is still needed
    const char *alnum, *alnum2;

};
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    63
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    64
/*
 * Append a scheme component to the URL.
 *
 * TODO: not implemented yet - the scheme is currently discarded.
 *
 * Returns zero; callers treat a nonzero return as an error. The explicit return is required, as falling off the end
 * of a non-void function whose value is used by the caller is undefined behaviour.
 */
static int _url_append_scheme (struct url *url, const char *data) {
    (void) url;
    (void) data;

    return 0;
}
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    67
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    68
/*
 * Append a new option key to the URL.
 *
 * TODO: not implemented yet - the key is currently discarded.
 *
 * Returns zero; callers treat a nonzero return as an error. The explicit return is required, as falling off the end
 * of a non-void function whose value is used by the caller is undefined behaviour.
 */
static int _url_append_opt_key (struct url *url, const char *key) {
    (void) url;
    (void) key;

    return 0;
}
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    71
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    72
/*
 * Set the value of an option on the URL.
 *
 * TODO: not implemented yet - the value is currently discarded.
 *
 * Returns zero; callers treat a nonzero return as an error. The explicit return is required, as falling off the end
 * of a non-void function whose value is used by the caller is undefined behaviour.
 */
static int _url_append_opt_val (struct url *url, const char *value) {
    (void) url;
    (void) value;

    return 0;
}
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    75
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
    76
static int url_lex_token (int _this_token, char *token_data, int _next_token, int _prev_token, void *arg) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
    77
    enum url_token this_token = _this_token, next_token = _next_token, prev_token = _prev_token;
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
    78
    struct url_state *state = arg;
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    79
    const char **copy_to = NULL;
13
385b9a10d096 inital playing around with a lexer/url parser
Tero Marttila <terom@fixme.fi>
parents:
diff changeset
    80
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    81
    (void) prev_token;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    82
    
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    83
    switch (this_token) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    84
        case URL_BEGIN_ALNUM:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    85
            switch (next_token) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    86
                case URL_SCHEME_SEP:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    87
                    // store the scheme
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    88
                    if (_url_append_scheme(state->url, token_data))
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    89
                        goto error;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    90
                    
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    91
                    break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    92
                
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    93
                case URL_USERNAME_END:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    94
                    // store the username
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    95
                    copy_to = &state->url->username; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    96
                
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    97
                case URL_PATH_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    98
                case URL_OPT_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
    99
                case LEX_EOF:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   100
                    // store the hostname
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   101
                    copy_to = &state->url->hostname; break;
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   102
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   103
                case URL_BEGIN_COLON:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   104
                    // gah...
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   105
                    copy_to = &state->alnum; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   106
                
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   107
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   108
                default:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   109
                    FATAL("weird next token");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   110
            }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   111
            
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   112
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   113
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   114
        case URL_BEGIN_COLON:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   115
            switch (next_token) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   116
                case URL_SCHEME_END_SLASH1:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   117
                    // store the schema
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   118
                    if (_url_append_scheme(state->url, token_data))
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   119
                        goto error;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   120
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   121
                    break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   122
                
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   123
                case URL_USERHOST_ALNUM2:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   124
                    // gah..
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   125
                    break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   126
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   127
                default:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   128
                    FATAL("weird next token");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   129
            }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   130
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   131
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   132
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   133
        case URL_SCHEME:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   134
            // store the scheme
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   135
            if (_url_append_scheme(state->url, token_data))
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   136
                goto error;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   137
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   138
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   139
    
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   140
        case URL_SCHEME_SEP:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   141
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   142
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   143
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   144
        case URL_SCHEME_END_COL:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   145
        case URL_SCHEME_END_SLASH1:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   146
        case URL_SCHEME_END_SLASH2:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   147
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   148
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   149
        
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   150
        case URL_USERHOST_ALNUM:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   151
            switch (next_token) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   152
                case URL_USERNAME_END:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   153
                    // store the username
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   154
                    copy_to = &state->url->username; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   155
                
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   156
                case URL_PATH_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   157
                case URL_OPT_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   158
                case LEX_EOF:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   159
                    // store the hostname
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   160
                    copy_to = &state->url->hostname; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   161
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   162
                case URL_USERHOST_COLON:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   163
                    // gah...
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   164
                    copy_to = &state->alnum; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   165
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   166
                default:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   167
                    FATAL("weird next token");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   168
            }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   169
            
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   170
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   171
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   172
        case URL_USERHOST_COLON:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   173
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   174
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   175
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   176
        case URL_USERHOST_ALNUM2:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   177
            switch (next_token) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   178
                case URL_USERNAME_END:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   179
                    // store the username and password
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   180
                    state->url->username = state->alnum; state->alnum = NULL;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   181
                    copy_to = &state->url->password;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   182
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   183
                    break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   184
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   185
                case URL_PATH_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   186
                case URL_OPT_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   187
                case LEX_EOF:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   188
                    // store the service
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   189
                    copy_to = &state->url->service; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   190
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   191
                default:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   192
                    FATAL("weird next token");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   193
            }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   194
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   195
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   196
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   197
        case URL_USERNAME:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   198
        case URL_PASSWORD_SEP:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   199
        case URL_PASSWORD:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   200
            FATAL("these should be overshadowed");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   201
        
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   202
        case URL_USERNAME_END:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   203
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   204
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   205
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   206
        case URL_HOSTNAME:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   207
            // store
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   208
            copy_to = &state->url->hostname; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   209
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   210
        case URL_SERVICE_SEP:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   211
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   212
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   213
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   214
        case URL_SERVICE:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   215
            // store
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   216
            copy_to = &state->url->service; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   217
        
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   218
        case URL_PATH_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   219
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   220
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   221
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   222
        case URL_PATH:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   223
            // store
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   224
            copy_to = &state->url->path; break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   225
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   226
        case URL_OPT_START:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   227
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   228
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   229
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   230
        case URL_OPT_KEY:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   231
            // store
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   232
            if (_url_append_opt_key(state->url, token_data))
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   233
                goto error;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   234
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   235
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   236
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   237
        case URL_OPT_EQ:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   238
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   239
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   240
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   241
        case URL_OPT_VAL:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   242
            // store
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   243
            if (_url_append_opt_val(state->url, token_data))
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   244
                goto error;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   245
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   246
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   247
        
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   248
        case URL_OPT_SEP:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   249
            // ignore
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   250
            break;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   251
        
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   252
        default:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   253
            FATAL("invalid token");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   254
    }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   255
    
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   256
    if (copy_to) {
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   257
        // copy the token data
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   258
        if ((*copy_to = strdup(token_data)) == NULL)
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   259
            ERROR("strdup");
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   260
    }
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   261
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   262
    // good
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   263
    return 0;
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   264
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   265
error:
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   266
    // XXX: error codes?
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   267
    return -1;
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   268
}
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   269
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   270
static struct lex url_lex = {
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   271
    .token_fn = url_lex_token,
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   272
    .char_fn = NULL,
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   273
    .end_fn = NULL,
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   274
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   275
    .state_count = URL_MAX,
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   276
    .state_list = {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   277
        LEX_STATE ( URL_BEGIN ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   278
            LEX_ALNUM       (           URL_BEGIN_ALNUM         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   279
            LEX_CHAR        (   ':',    URL_SERVICE_SEP         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   280
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   281
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   282
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   283
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   284
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   285
        // this can be URL_SCHEME, URL_USERNAME or URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   286
        LEX_STATE_END ( URL_BEGIN_ALNUM ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   287
            LEX_ALNUM       (           URL_BEGIN_ALNUM         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   288
            LEX_CHAR        (   '+',    URL_SCHEME_SEP          ),  // it was URL_SCHEME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   289
            LEX_CHAR        (   ':',    URL_BEGIN_COLON         ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   290
            LEX_CHAR        (   '@',    URL_USERNAME_END        ),  // it was URL_USERNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   291
            LEX_CHAR        (   '/',    URL_PATH_START          ),  // it was URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   292
            LEX_CHAR        (   '?',    URL_OPT_START           ),  // it was URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   293
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   294
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   295
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   296
        // this can be URL_SCHEME_END_COL, URL_USERNAME_END or URL_SERVICE_SEP
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   297
        LEX_STATE ( URL_BEGIN_COLON ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   298
            LEX_CHAR        (   '/',    URL_SCHEME_END_SLASH1   ),  // it was URL_SCHEME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   299
            LEX_ALNUM       (           URL_USERHOST_ALNUM2     ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   300
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   301
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   302
       
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   303
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   304
        LEX_STATE ( URL_SCHEME ) { 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   305
            LEX_ALNUM       (           URL_SCHEME              ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   306
            LEX_CHAR        (   '+',    URL_SCHEME_SEP          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   307
            LEX_CHAR        (   ':',    URL_SCHEME_END_COL      ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   308
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   309
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   310
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   311
        LEX_STATE ( URL_SCHEME_SEP ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   312
            LEX_ALNUM       (           URL_SCHEME              ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   313
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   314
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   315
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   316
        LEX_STATE ( URL_SCHEME_END_COL ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   317
            LEX_CHAR        (   '/',    URL_SCHEME_END_SLASH1   ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   318
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   319
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   320
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   321
        LEX_STATE ( URL_SCHEME_END_SLASH1 ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   322
            LEX_CHAR        (   '/',    URL_SCHEME_END_SLASH2   ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   323
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   324
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   325
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   326
        LEX_STATE_END ( URL_SCHEME_END_SLASH2 ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   327
            LEX_ALNUM       (           URL_USERHOST_ALNUM      ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   328
            LEX_CHAR        (   ':',    URL_SERVICE_SEP         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   329
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   330
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   331
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   332
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   333
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   334
        // this can be URL_USERNAME or URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   335
        LEX_STATE_END ( URL_USERHOST_ALNUM ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   336
            LEX_ALNUM       (           URL_USERHOST_ALNUM      ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   337
            LEX_CHAR        (   ':',    URL_USERHOST_COLON      ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   338
            LEX_CHAR        (   '@',    URL_USERNAME_END        ),  // it was URL_USERNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   339
            LEX_CHAR        (   '/',    URL_PATH_START          ),  // it was URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   340
            LEX_CHAR        (   '?',    URL_OPT_START           ),  // it was URL_HOSTNAME
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   341
            LEX_END
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   342
        },
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   343
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   344
        // this can be URL_USERNAME_END or URL_SERVICE_SEP
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   345
        LEX_STATE ( URL_USERHOST_COLON ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   346
            LEX_ALNUM       (           URL_USERHOST_ALNUM2        ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   347
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   348
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   349
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   350
        // this can be URL_PASSWORD or URL_SERVICE
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   351
        LEX_STATE_END ( URL_USERHOST_ALNUM2 ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   352
            LEX_ALNUM       (           URL_USERHOST_ALNUM      ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   353
            LEX_CHAR        (   '@',    URL_USERNAME_END        ),  // it was URL_PASSSWORD
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   354
            LEX_CHAR        (   '/',    URL_PATH_START          ),  // it was URL_SERVICE
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   355
            LEX_CHAR        (   '?',    URL_OPT_START           ),  // it was URL_SERVICE
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   356
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   357
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   358
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   359
        // dummy states, covered by URL_USERHOST_ALNUM/URL_USERHOST_COLON/URL_USERHOST_ALNUM2
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   360
        LEX_STATE ( URL_USERNAME ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   361
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   362
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   363
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   364
        LEX_STATE ( URL_PASSWORD_SEP ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   365
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   366
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   367
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   368
        LEX_STATE ( URL_PASSWORD ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   369
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   370
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   371
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   372
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   373
        LEX_STATE_END ( URL_USERNAME_END ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   374
            LEX_ALNUM       (           URL_HOSTNAME            ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   375
            LEX_CHAR        (   ':',    URL_SERVICE_SEP         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   376
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   377
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   378
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   379
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   380
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   381
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   382
        LEX_STATE_END ( URL_HOSTNAME ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   383
            LEX_ALNUM       (           URL_HOSTNAME            ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   384
            LEX_CHAR        (   ':',    URL_SERVICE_SEP         ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   385
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   386
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   387
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   388
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   389
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   390
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   391
        LEX_STATE ( URL_SERVICE_SEP ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   392
            LEX_ALNUM       (           URL_SERVICE            ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   393
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   394
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   395
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   396
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   397
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   398
        LEX_STATE_END ( URL_SERVICE ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   399
            LEX_ALNUM       (           URL_SERVICE            ), 
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   400
            LEX_CHAR        (   '/',    URL_PATH_START          ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   401
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   402
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   403
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   404
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   405
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   406
        LEX_STATE_END ( URL_PATH_START ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   407
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   408
            LEX_DEFAULT     (           URL_PATH                ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   409
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   410
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   411
        LEX_STATE_END ( URL_PATH ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   412
            LEX_CHAR        (   '?',    URL_OPT_START           ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   413
            LEX_DEFAULT     (           URL_PATH                ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   414
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   415
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   416
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   417
        LEX_STATE_END ( URL_OPT_START ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   418
            LEX_CHAR        (   '&',    URL_OPT_SEP             ),
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   419
            LEX_INVALID     (   '='                             ),
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   420
            LEX_DEFAULT     (           URL_OPT_KEY             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   421
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   422
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   423
        LEX_STATE_END ( URL_OPT_KEY ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   424
            LEX_CHAR        (   '&',    URL_OPT_SEP             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   425
            LEX_CHAR        (   '=',    URL_OPT_EQ              ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   426
            LEX_DEFAULT     (           URL_OPT_KEY             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   427
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   428
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   429
        LEX_STATE_END ( URL_OPT_EQ ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   430
            LEX_CHAR        (   '&',    URL_OPT_SEP             ),
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   431
            LEX_INVALID     (   '='                             ),
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   432
            LEX_DEFAULT     (           URL_OPT_VAL             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   433
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   434
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   435
        LEX_STATE_END ( URL_OPT_VAL ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   436
            LEX_CHAR        (   '&',    URL_OPT_SEP             ),
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   437
            LEX_INVALID     (   '='                             ),
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   438
            LEX_DEFAULT     (           URL_OPT_VAL             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   439
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   440
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   441
        LEX_STATE_END ( URL_OPT_SEP ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   442
            LEX_CHAR        (   '&',    URL_OPT_SEP             ),
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   443
            LEX_INVALID     (   '='                             ),
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   444
            LEX_DEFAULT     (           URL_OPT_KEY             ),
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   445
        },
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   446
        
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   447
        LEX_STATE ( URL_ERROR ) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   448
            LEX_END
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   449
        },
15
a8d183e79ed9 look ma, it compiles\!
Tero Marttila <terom@fixme.fi>
parents: 14
diff changeset
   450
    }
14
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   451
};
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   452
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   453
int url_parse (struct url *url, const char *text) {
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   454
    struct url_state state; ZINIT(state);
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   455
    int ret;
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   456
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   457
    // set up state
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   458
    state.url = url;
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   459
    
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   460
    // parse it
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   461
    if ((ret = lexer(&url_lex, text, &state)))
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   462
        ERROR("invalid URL");
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   463
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   464
    // success
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   465
    return 0;
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   466
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   467
error:
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   468
    return -1;
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   469
}
115067dfba55 more intermediate work
Tero Marttila <terom@fixme.fi>
parents: 13
diff changeset
   470