diff --git a/projects/mongrel_experimental/Manifest b/projects/mongrel_experimental/Manifest index cec6045d..942f019e 100644 --- a/projects/mongrel_experimental/Manifest +++ b/projects/mongrel_experimental/Manifest @@ -1,5 +1,16 @@ CHANGELOG COPYING +ext/uri_classifier/ext_help.h +ext/uri_classifier/extconf.rb +ext/uri_classifier/tst.h +ext/uri_classifier/tst_cleanup.c +ext/uri_classifier/tst_delete.c +ext/uri_classifier/tst_grow_node_free_list.c +ext/uri_classifier/tst_init.c +ext/uri_classifier/tst_insert.c +ext/uri_classifier/tst_search.c +ext/uri_classifier/uri_classifier.c +lib/mongrel_experimental.rb LICENSE Manifest README diff --git a/projects/mongrel_experimental/ext/uri_classifier/uri_classifier.c b/projects/mongrel_experimental/ext/uri_classifier/uri_classifier.c index d63e06e5..fccbc395 100644 --- a/projects/mongrel_experimental/ext/uri_classifier/uri_classifier.c +++ b/projects/mongrel_experimental/ext/uri_classifier/uri_classifier.c @@ -10,359 +10,12 @@ #include "tst.h" static VALUE mMongrel; -static VALUE cHttpParser; static VALUE cURIClassifier; -static VALUE eHttpParserError; #define id_handler_map rb_intern("@handler_map") -#define id_http_body rb_intern("@http_body") - -static VALUE global_http_prefix; -static VALUE global_request_method; -static VALUE global_request_uri; -static VALUE global_fragment; -static VALUE global_query_string; -static VALUE global_http_version; -static VALUE global_content_length; -static VALUE global_http_content_length; -static VALUE global_request_path; -static VALUE global_content_type; -static VALUE global_http_content_type; -static VALUE global_gateway_interface; -static VALUE global_gateway_interface_value; -static VALUE global_server_name; -static VALUE global_server_port; -static VALUE global_server_protocol; -static VALUE global_server_protocol_value; -static VALUE global_http_host; -static VALUE global_mongrel_version; -static VALUE global_server_software; -static VALUE global_port_80; #define TRIE_INCREASE 30 -/** Defines common length and error messages for input length validation. */ -#define DEF_MAX_LENGTH(N,length) const size_t MAX_##N##_LENGTH = length; const char *MAX_##N##_LENGTH_ERR = "HTTP element " # N " is longer than the " # length " allowed length." - -/** Validates the max length of given input and throws an HttpParserError exception if over. */ -#define VALIDATE_MAX_LENGTH(len, N) if(len > MAX_##N##_LENGTH) { rb_raise(eHttpParserError, MAX_##N##_LENGTH_ERR); } - -/** Defines global strings in the init method. */ -#define DEF_GLOBAL(N, val) global_##N = rb_obj_freeze(rb_str_new2(val)); rb_global_variable(&global_##N) - - -/* Defines the maximum allowed lengths for various input elements.*/ -DEF_MAX_LENGTH(FIELD_NAME, 256); -DEF_MAX_LENGTH(FIELD_VALUE, 80 * 1024); -DEF_MAX_LENGTH(REQUEST_URI, 1024 * 12); -DEF_MAX_LENGTH(FRAGMENT, 1024); /* Don't know if this length is specified somewhere or not */ -DEF_MAX_LENGTH(REQUEST_PATH, 1024); -DEF_MAX_LENGTH(QUERY_STRING, (1024 * 10)); -DEF_MAX_LENGTH(HEADER, (1024 * (80 + 32))); - - -void http_field(void *data, const char *field, size_t flen, const char *value, size_t vlen) -{ - char *ch, *end; - VALUE req = (VALUE)data; - VALUE v = Qnil; - VALUE f = Qnil; - - VALIDATE_MAX_LENGTH(flen, FIELD_NAME); - VALIDATE_MAX_LENGTH(vlen, FIELD_VALUE); - - v = rb_str_new(value, vlen); - f = rb_str_dup(global_http_prefix); - f = rb_str_buf_cat(f, field, flen); - - for(ch = RSTRING(f)->ptr, end = ch + RSTRING(f)->len; ch < end; ch++) { - if(*ch == '-') { - *ch = '_'; - } else { - *ch = toupper(*ch); - } - } - - rb_hash_aset(req, f, v); -} - -void request_method(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = Qnil; - - val = rb_str_new(at, length); - rb_hash_aset(req, global_request_method, val); -} - -void request_uri(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = Qnil; - - VALIDATE_MAX_LENGTH(length, REQUEST_URI); - - val = rb_str_new(at, length); - rb_hash_aset(req, global_request_uri, val); -} - -void fragment(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = Qnil; - - VALIDATE_MAX_LENGTH(length, FRAGMENT); - - val = rb_str_new(at, length); - rb_hash_aset(req, global_fragment, val); -} - -void request_path(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = Qnil; - - VALIDATE_MAX_LENGTH(length, REQUEST_PATH); - - val = rb_str_new(at, length); - rb_hash_aset(req, global_request_path, val); -} - -void query_string(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = Qnil; - - VALIDATE_MAX_LENGTH(length, QUERY_STRING); - - val = rb_str_new(at, length); - rb_hash_aset(req, global_query_string, val); -} - -void http_version(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE val = rb_str_new(at, length); - rb_hash_aset(req, global_http_version, val); -} - -/** Finalizes the request header to have a bunch of stuff that's - needed. */ - -void header_done(void *data, const char *at, size_t length) -{ - VALUE req = (VALUE)data; - VALUE temp = Qnil; - VALUE ctype = Qnil; - VALUE clen = Qnil; - char *colon = NULL; - - clen = rb_hash_aref(req, global_http_content_length); - if(clen != Qnil) { - rb_hash_aset(req, global_content_length, clen); - } - - ctype = rb_hash_aref(req, global_http_content_type); - if(ctype != Qnil) { - rb_hash_aset(req, global_content_type, ctype); - } - - rb_hash_aset(req, global_gateway_interface, global_gateway_interface_value); - if((temp = rb_hash_aref(req, global_http_host)) != Qnil) { - /* ruby better close strings off with a '\0' dammit */ - colon = strchr(RSTRING(temp)->ptr, ':'); - if(colon != NULL) { - rb_hash_aset(req, global_server_name, rb_str_substr(temp, 0, colon - RSTRING(temp)->ptr)); - rb_hash_aset(req, global_server_port, - rb_str_substr(temp, colon - RSTRING(temp)->ptr+1, - RSTRING(temp)->len)); - } else { - rb_hash_aset(req, global_server_name, temp); - rb_hash_aset(req, global_server_port, global_port_80); - } - } - - /* grab the initial body and stuff it into an ivar */ - rb_ivar_set(req, id_http_body, rb_str_new(at, length)); - rb_hash_aset(req, global_server_protocol, global_server_protocol_value); - rb_hash_aset(req, global_server_software, global_mongrel_version); -} - - -void HttpParser_free(void *data) { - TRACE(); - - if(data) { - free(data); - } -} - - -VALUE HttpParser_alloc(VALUE klass) -{ - VALUE obj; - http_parser *hp = ALLOC_N(http_parser, 1); - TRACE(); - hp->http_field = http_field; - hp->request_method = request_method; - hp->request_uri = request_uri; - hp->fragment = fragment; - hp->request_path = request_path; - hp->query_string = query_string; - hp->http_version = http_version; - hp->header_done = header_done; - http_parser_init(hp); - - obj = Data_Wrap_Struct(klass, NULL, HttpParser_free, hp); - - return obj; -} - - -/** - * call-seq: - * parser.new -> parser - * - * Creates a new parser. - */ -VALUE HttpParser_init(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - http_parser_init(http); - - return self; -} - - -/** - * call-seq: - * parser.reset -> nil - * - * Resets the parser to it's initial state so that you can reuse it - * rather than making new ones. - */ -VALUE HttpParser_reset(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - http_parser_init(http); - - return Qnil; -} - - -/** - * call-seq: - * parser.finish -> true/false - * - * Finishes a parser early which could put in a "good" or bad state. - * You should call reset after finish it or bad things will happen. - */ -VALUE HttpParser_finish(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - http_parser_finish(http); - - return http_parser_is_finished(http) ? Qtrue : Qfalse; -} - - -/** - * call-seq: - * parser.execute(req_hash, data, start) -> Integer - * - * Takes a Hash and a String of data, parses the String of data filling in the Hash - * returning an Integer to indicate how much of the data has been read. No matter - * what the return value, you should call HttpParser#finished? and HttpParser#error? - * to figure out if it's done parsing or there was an error. - * - * This function now throws an exception when there is a parsing error. This makes - * the logic for working with the parser much easier. You can still test for an - * error, but now you need to wrap the parser with an exception handling block. - * - * The third argument allows for parsing a partial request and then continuing - * the parsing from that position. It needs all of the original data as well - * so you have to append to the data buffer as you read. - */ -VALUE HttpParser_execute(VALUE self, VALUE req_hash, VALUE data, VALUE start) -{ - http_parser *http = NULL; - int from = 0; - char *dptr = NULL; - long dlen = 0; - - DATA_GET(self, http_parser, http); - - from = FIX2INT(start); - dptr = RSTRING(data)->ptr; - dlen = RSTRING(data)->len; - - if(from >= dlen) { - rb_raise(eHttpParserError, "Requested start is after data buffer end."); - } else { - http->data = (void *)req_hash; - http_parser_execute(http, dptr, dlen, from); - - VALIDATE_MAX_LENGTH(http_parser_nread(http), HEADER); - - if(http_parser_has_error(http)) { - rb_raise(eHttpParserError, "Invalid HTTP format, parsing fails."); - } else { - return INT2FIX(http_parser_nread(http)); - } - } -} - - - -/** - * call-seq: - * parser.error? -> true/false - * - * Tells you whether the parser is in an error state. - */ -VALUE HttpParser_has_error(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - - return http_parser_has_error(http) ? Qtrue : Qfalse; -} - - -/** - * call-seq: - * parser.finished? -> true/false - * - * Tells you whether the parser is finished or not and in a good state. - */ -VALUE HttpParser_is_finished(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - - return http_parser_is_finished(http) ? Qtrue : Qfalse; -} - - -/** - * call-seq: - * parser.nread -> Integer - * - * Returns the amount of data processed so far during this processing cycle. It is - * set to 0 on initialize or reset calls and is incremented each time execute is called. - */ -VALUE HttpParser_nread(VALUE self) -{ - http_parser *http = NULL; - DATA_GET(self, http_parser, http); - - return INT2FIX(http->nread); -} - - void URIClassifier_free(void *data) { TRACE(); @@ -372,8 +25,6 @@ void URIClassifier_free(void *data) } } - - VALUE URIClassifier_alloc(VALUE klass) { VALUE obj;