summaryrefslogtreecommitdiff
path: root/scan_urlencoded_query.c
blob: 7aeabab335f7f1ef0b0f6eb30efa97fb1deb0768 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
#include "scan.h"

#define BREAK_AT_QUESTIONMARK (1<<0)
#define BREAK_AT_WHITESPACE   (1<<1)
#define BREAK_AT_AMPERSAND    (1<<2)
#define BREAK_AT_EQUALSIGN    (1<<3)

#define SCAN_PATH             ( BREAK_AT_QUESTIONMARK | BREAK_AT_WHITESPACE )
#define SCAN_SEARCHPATH_PARAM ( BREAK_AT_EQUALSIGN )
#define SCAN_SEARCHPATH_VALUE ( BREAK_AT_AMPERSAND | BREAK_AT_WHITESPACE )

// Idea is to do a in place replacement or guarantee at least
// strlen( string ) bytes in deststring
// watch http://www.ietf.org/rfc/rfc2396.txt
//       unreserved    = alphanum | mark
//       mark          = "-" | "_" | "." | "!" | "~" | "*" | "'" | "(" | ")"
// we add '%' to the matrix to not stop at encoded chars.

static const unsigned char reserved_matrix[] = { 0xA2, 0x63, 0xFF, 0x03, 0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x47};
inline int is_unreserved( unsigned char c ) const {
  if( ( c <= 32 ) || ( c >= 127 ) ) return 0; return 1&(reserved_matrix[(c-32)>>3]>>(c&7));
}

size_t scan_urlencoded_query(char **string, char *deststring, int flags) {
  register const unsigned char* s=*(const unsigned char*) string;
  const unsigned char *d = deststring;
  register unsigned char b, c;

  while ( is_unreserved( c = *s++) ) {
    if (c=='%') {
      if( ( c = scan_fromhex(*s++) ) < 0 ) return -1;
      if( ( b = scan_fromhex(*s++) ) < 0 ) return -1;
      c=(c<<4)|b;
    }
    *d++ = c;
  }

  switch( c ) {
  case 0: case '\r': case '\n': case ' ':
    if ( flags & BREAK_AT_WHITESPACE == 0 ) return -1;
    break;
  case '?':
    if ( flags & BREAK_AT_QUESTIONMARK == 0 ) return -1;
    break;
  case '=':
    if ( flags & BREAK_AT_EQUALSIGN == 0 ) return -1;
    break;
  case '&':
    if ( flags & BREAK_AT_AMPERSAND == 0 ) return -1;
    break;
  default:
    return -1;
  }

  *string = s;
  return d - deststring;
}