mirror of git://erdgeist.org/opentracker
Our scanner routine for the URI query string
parent
88679832f0
commit
2adf4fb28a
@ -0,0 +1,57 @@
|
|||||||
|
#include "scan.h"
|
||||||
|
|
||||||
|
#define BREAK_AT_QUESTIONMARK (1<<0)
|
||||||
|
#define BREAK_AT_WHITESPACE (1<<1)
|
||||||
|
#define BREAK_AT_AMPERSAND (1<<2)
|
||||||
|
#define BREAK_AT_EQUALSIGN (1<<3)
|
||||||
|
|
||||||
|
#define SCAN_PATH ( BREAK_AT_QUESTIONMARK | BREAK_AT_WHITESPACE )
|
||||||
|
#define SCAN_SEARCHPATH_PARAM ( BREAK_AT_EQUALSIGN )
|
||||||
|
#define SCAN_SEARCHPATH_VALUE ( BREAK_AT_AMPERSAND | BREAK_AT_WHITESPACE )
|
||||||
|
|
||||||
|
// Idea is to do a in place replacement or guarantee at least
|
||||||
|
// strlen( string ) bytes in deststring
|
||||||
|
// watch http://www.ietf.org/rfc/rfc2396.txt
|
||||||
|
// unreserved = alphanum | mark
|
||||||
|
// mark = "-" | "_" | "." | "!" | "~" | "*" | "'" | "(" | ")"
|
||||||
|
// we add '%' to the matrix to not stop at encoded chars.
|
||||||
|
|
||||||
|
static const unsigned char reserved_matrix[] = { 0xA2, 0x63, 0xFF, 0x03, 0xFE, 0xFF, 0xFF, 0x87, 0xFE, 0xFF, 0xFF, 0x47};
|
||||||
|
inline int is_unreserved( unsigned char c ) const {
|
||||||
|
if( ( c <= 32 ) || ( c >= 127 ) ) return 0; return 1&(reserved_matrix[(c-32)>>3]>>(c&7));
|
||||||
|
}
|
||||||
|
|
||||||
|
size_t scan_urlencoded_query(char **string, char *deststring, int flags) {
|
||||||
|
register const unsigned char* s=*(const unsigned char*) string;
|
||||||
|
const unsigned char *d = deststring;
|
||||||
|
register unsigned char b, c;
|
||||||
|
|
||||||
|
while ( is_unreserved( c = *s++) ) {
|
||||||
|
if (c=='%') {
|
||||||
|
if( ( c = scan_fromhex(*s++) ) < 0 ) return -1;
|
||||||
|
if( ( b = scan_fromhex(*s++) ) < 0 ) return -1;
|
||||||
|
c=(c<<4)|b;
|
||||||
|
}
|
||||||
|
*d++ = c;
|
||||||
|
}
|
||||||
|
|
||||||
|
switch( c ) {
|
||||||
|
case 0: case '\r': case '\n': case ' ':
|
||||||
|
if ( flags & BREAK_AT_WHITESPACE == 0 ) return -1;
|
||||||
|
break;
|
||||||
|
case '?':
|
||||||
|
if ( flags & BREAK_AT_QUESTIONMARK == 0 ) return -1;
|
||||||
|
break;
|
||||||
|
case '=':
|
||||||
|
if ( flags & BREAK_AT_EQUALSIGN == 0 ) return -1;
|
||||||
|
break;
|
||||||
|
case '&':
|
||||||
|
if ( flags & BREAK_AT_AMPERSAND == 0 ) return -1;
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
return -1;
|
||||||
|
}
|
||||||
|
|
||||||
|
*string = s;
|
||||||
|
return d - deststring;
|
||||||
|
}
|
@ -0,0 +1,20 @@
|
|||||||
|
#ifdef __SCAN_URLENCODED_QUERY_H__
|
||||||
|
#define __SCAN_URLENCODED_QUERY_H__
|
||||||
|
|
||||||
|
#define BREAK_AT_QUESTIONMARK (1<<0)
|
||||||
|
#define BREAK_AT_WHITESPACE (1<<1)
|
||||||
|
#define BREAK_AT_AMPERSAND (1<<2)
|
||||||
|
#define BREAK_AT_EQUALSIGN (1<<3)
|
||||||
|
|
||||||
|
#define SCAN_PATH ( BREAK_AT_QUESTIONMARK | BREAK_AT_WHITESPACE )
|
||||||
|
#define SCAN_SEARCHPATH_PARAM ( BREAK_AT_EQUALSIGN )
|
||||||
|
#define SCAN_SEARCHPATH_VALUE ( BREAK_AT_AMPERSAND | BREAK_AT_WHITESPACE )
|
||||||
|
|
||||||
|
// string pointer to source, pointer to after terminator on return
|
||||||
|
// deststring pointer to destination
|
||||||
|
// flags determines, what to parse
|
||||||
|
// returns number of valid converted characters in deststring
|
||||||
|
// or -1 for parse error
|
||||||
|
size_t scan_urlencoded_query(char **string, char *deststring, int flags);
|
||||||
|
|
||||||
|
#endif
|
Loading…
Reference in New Issue