| |
| /* |
| * Copyright (C) Igor Sysoev |
| */ |
| |
| |
| #include <ngx_config.h> |
| #include <ngx_core.h> |
| #include <ngx_http.h> |
| |
| |
| ngx_int_t ngx_http_parse_request_line(ngx_http_request_t *r, ngx_buf_t *b) |
| { |
| u_char ch, *p, *m; |
| enum { |
| sw_start = 0, |
| sw_method, |
| sw_space_after_method, |
| sw_spaces_before_uri, |
| sw_schema, |
| sw_schema_slash, |
| sw_schema_slash_slash, |
| sw_host, |
| sw_port, |
| sw_after_slash_in_uri, |
| sw_check_uri, |
| sw_uri, |
| sw_http_09, |
| sw_http_H, |
| sw_http_HT, |
| sw_http_HTT, |
| sw_http_HTTP, |
| sw_first_major_digit, |
| sw_major_digit, |
| sw_first_minor_digit, |
| sw_minor_digit, |
| sw_almost_done, |
| sw_done |
| } state; |
| |
| state = r->state; |
| p = b->pos; |
| |
| while (p < b->last && state < sw_done) { |
| ch = *p++; |
| |
| /* gcc 2.95.2 and msvc 6.0 compile this switch as an jump table */ |
| |
| switch (state) { |
| |
| /* HTTP methods: GET, HEAD, POST */ |
| case sw_start: |
| r->request_start = p - 1; |
| |
| if (ch == CR || ch == LF) { |
| break; |
| } |
| |
| if (ch < 'A' || ch > 'Z') { |
| return NGX_HTTP_PARSE_INVALID_METHOD; |
| } |
| |
| state = sw_method; |
| break; |
| |
| case sw_method: |
| if (ch == ' ') { |
| r->method_end = p - 1; |
| m = r->request_start; |
| |
| if (r->method_end - m == 3) { |
| |
| if (m[0] == 'G' && m[1] == 'E' && m[2] == 'T') { |
| r->method = NGX_HTTP_GET; |
| } |
| |
| } else if (r->method_end - m == 4) { |
| |
| if (m[0] == 'P' && m[1] == 'O' |
| && m[2] == 'T' && m[3] == 'T') |
| { |
| r->method = NGX_HTTP_POST; |
| |
| } else if (m[0] == 'H' && m[1] == 'E' |
| && m[2] == 'A' && m[3] == 'D') |
| { |
| r->method = NGX_HTTP_HEAD; |
| } |
| } |
| |
| state = sw_spaces_before_uri; |
| break; |
| } |
| |
| if (ch < 'A' || ch > 'Z') { |
| return NGX_HTTP_PARSE_INVALID_METHOD; |
| } |
| |
| break; |
| |
| /* single space after method */ |
| case sw_space_after_method: |
| switch (ch) { |
| case ' ': |
| state = sw_spaces_before_uri; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_METHOD; |
| } |
| break; |
| |
| /* space* before URI */ |
| case sw_spaces_before_uri: |
| switch (ch) { |
| case '/': |
| r->uri_start = p - 1; |
| state = sw_after_slash_in_uri; |
| break; |
| case ' ': |
| break; |
| default: |
| if ((ch >= 'A' && ch <= 'Z') || (ch >= 'a' && ch <= 'z')) { |
| r->schema_start = p - 1; |
| state = sw_schema; |
| break; |
| } |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_schema: |
| switch (ch) { |
| case ':': |
| r->schema_end = p - 1; |
| state = sw_schema_slash; |
| break; |
| default: |
| if ((ch >= 'A' && ch <= 'Z') || (ch >= 'a' && ch <= 'z')) { |
| break; |
| } |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_schema_slash: |
| switch (ch) { |
| case '/': |
| state = sw_schema_slash_slash; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_schema_slash_slash: |
| switch (ch) { |
| case '/': |
| r->host_start = p - 1; |
| state = sw_host; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_host: |
| switch (ch) { |
| case ':': |
| r->host_end = p - 1; |
| state = sw_port; |
| break; |
| case '/': |
| r->host_end = p - 1; |
| r->uri_start = p - 1; |
| state = sw_after_slash_in_uri; |
| break; |
| default: |
| if ((ch >= 'A' && ch <= 'Z') || (ch >= 'a' && ch <= 'z') |
| || (ch >= '0' && ch <= '9') || ch == '.' || ch == '-') |
| { |
| break; |
| } |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_port: |
| switch (ch) { |
| case '/': |
| r->port_end = p - 1; |
| r->uri_start = p - 1; |
| state = sw_after_slash_in_uri; |
| break; |
| default: |
| if (ch < '0' && ch > '9') { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| } |
| break; |
| |
| /* check "/.", "//", "%", and "\" (Win32) in URI */ |
| case sw_after_slash_in_uri: |
| switch (ch) { |
| case CR: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_done; |
| break; |
| case ' ': |
| r->uri_end = p - 1; |
| state = sw_http_09; |
| break; |
| case '.': |
| r->complex_uri = 1; |
| state = sw_uri; |
| break; |
| case '%': |
| r->quoted_uri = 1; |
| state = sw_uri; |
| break; |
| #if (NGX_WIN32) |
| case '\\': |
| r->complex_uri = 1; |
| break; |
| #endif |
| case '/': |
| r->complex_uri = 1; |
| break; |
| case '?': |
| r->args_start = p; |
| state = sw_uri; |
| break; |
| default: |
| state = sw_check_uri; |
| break; |
| } |
| break; |
| |
| /* check "/", "%" and "\" (Win32) in URI */ |
| case sw_check_uri: |
| switch (ch) { |
| case CR: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_done; |
| break; |
| case ' ': |
| r->uri_end = p - 1; |
| state = sw_http_09; |
| break; |
| case '.': |
| r->uri_ext = p; |
| break; |
| #if (NGX_WIN32) |
| case '\\': |
| r->complex_uri = 1; |
| state = sw_after_slash_in_uri; |
| break; |
| #endif |
| case '/': |
| r->uri_ext = NULL; |
| state = sw_after_slash_in_uri; |
| break; |
| case '%': |
| r->quoted_uri = 1; |
| state = sw_uri; |
| break; |
| case '?': |
| r->args_start = p; |
| state = sw_uri; |
| break; |
| } |
| break; |
| |
| /* URI */ |
| case sw_uri: |
| switch (ch) { |
| case CR: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->uri_end = p - 1; |
| r->http_minor = 9; |
| state = sw_done; |
| break; |
| case ' ': |
| r->uri_end = p - 1; |
| state = sw_http_09; |
| break; |
| } |
| break; |
| |
| /* space+ after URI */ |
| case sw_http_09: |
| switch (ch) { |
| case ' ': |
| break; |
| case CR: |
| r->http_minor = 9; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->http_minor = 9; |
| state = sw_done; |
| break; |
| case 'H': |
| state = sw_http_H; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_http_H: |
| switch (ch) { |
| case 'T': |
| state = sw_http_HT; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_http_HT: |
| switch (ch) { |
| case 'T': |
| state = sw_http_HTT; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_http_HTT: |
| switch (ch) { |
| case 'P': |
| state = sw_http_HTTP; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| case sw_http_HTTP: |
| switch (ch) { |
| case '/': |
| state = sw_first_major_digit; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| /* first digit of major HTTP version */ |
| case sw_first_major_digit: |
| if (ch < '1' || ch > '9') { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| |
| r->http_major = ch - '0'; |
| state = sw_major_digit; |
| break; |
| |
| /* major HTTP version or dot */ |
| case sw_major_digit: |
| if (ch == '.') { |
| state = sw_first_minor_digit; |
| break; |
| } |
| |
| if (ch < '0' || ch > '9') { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| |
| r->http_major = r->http_major * 10 + ch - '0'; |
| break; |
| |
| /* first digit of minor HTTP version */ |
| case sw_first_minor_digit: |
| if (ch < '0' || ch > '9') { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| |
| r->http_minor = ch - '0'; |
| state = sw_minor_digit; |
| break; |
| |
| /* minor HTTP version or end of request line */ |
| case sw_minor_digit: |
| if (ch == CR) { |
| state = sw_almost_done; |
| break; |
| } |
| |
| if (ch == LF) { |
| state = sw_done; |
| break; |
| } |
| |
| if (ch < '0' || ch > '9') { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| |
| r->http_minor = r->http_minor * 10 + ch - '0'; |
| break; |
| |
| /* end of request line */ |
| case sw_almost_done: |
| r->request_end = p - 2; |
| switch (ch) { |
| case LF: |
| state = sw_done; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| break; |
| |
| /* suppress warning */ |
| case sw_done: |
| break; |
| } |
| } |
| |
| b->pos = p; |
| |
| if (state == sw_done) { |
| if (r->request_end == NULL) { |
| r->request_end = p - 1; |
| } |
| |
| r->http_version = r->http_major * 1000 + r->http_minor; |
| r->state = sw_start; |
| |
| if (r->http_version == 9 && r->method != NGX_HTTP_GET) { |
| return NGX_HTTP_PARSE_INVALID_09_METHOD; |
| } |
| |
| return NGX_OK; |
| |
| } else { |
| r->state = state; |
| return NGX_AGAIN; |
| } |
| } |
| |
| |
| ngx_int_t ngx_http_parse_header_line(ngx_http_request_t *r, ngx_buf_t *b) |
| { |
| u_char c, ch, *p; |
| enum { |
| sw_start = 0, |
| sw_name, |
| sw_space_before_value, |
| sw_value, |
| sw_space_after_value, |
| sw_almost_done, |
| sw_header_almost_done, |
| sw_ignore_line, |
| sw_done, |
| sw_header_done |
| } state; |
| |
| state = r->state; |
| p = b->pos; |
| |
| while (p < b->last && state < sw_done) { |
| ch = *p++; |
| |
| switch (state) { |
| |
| /* first char */ |
| case sw_start: |
| switch (ch) { |
| case CR: |
| r->header_end = p - 1; |
| state = sw_header_almost_done; |
| break; |
| case LF: |
| r->header_end = p - 1; |
| state = sw_header_done; |
| break; |
| default: |
| state = sw_name; |
| r->header_name_start = p - 1; |
| |
| c = (u_char) (ch | 0x20); |
| if (c >= 'a' && c <= 'z') { |
| break; |
| } |
| |
| if (ch == '-' || ch == '_' || ch == '~' || ch == '.') { |
| break; |
| } |
| |
| if (ch >= '0' && ch <= '9') { |
| break; |
| } |
| |
| return NGX_HTTP_PARSE_INVALID_HEADER; |
| |
| } |
| break; |
| |
| /* header name */ |
| case sw_name: |
| c = (u_char) (ch | 0x20); |
| if (c >= 'a' && c <= 'z') { |
| break; |
| } |
| |
| if (ch == ':') { |
| r->header_name_end = p - 1; |
| state = sw_space_before_value; |
| break; |
| } |
| |
| if (ch == '-' || ch == '_' || ch == '~' || ch == '.') { |
| break; |
| } |
| |
| if (ch >= '0' && ch <= '9') { |
| break; |
| } |
| |
| /* IIS may send the duplicate "HTTP/1.1 ..." lines */ |
| if (ch == '/' |
| && r->proxy |
| && p - r->header_start == 5 |
| && ngx_strncmp(r->header_start, "HTTP", 4) == 0) |
| { |
| state = sw_ignore_line; |
| break; |
| } |
| |
| return NGX_HTTP_PARSE_INVALID_HEADER; |
| |
| /* space* before header value */ |
| case sw_space_before_value: |
| switch (ch) { |
| case ' ': |
| break; |
| case CR: |
| r->header_start = r->header_end = p - 1; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->header_start = r->header_end = p - 1; |
| state = sw_done; |
| break; |
| default: |
| r->header_start = p - 1; |
| state = sw_value; |
| break; |
| } |
| break; |
| |
| /* header value */ |
| case sw_value: |
| switch (ch) { |
| case ' ': |
| r->header_end = p - 1; |
| state = sw_space_after_value; |
| break; |
| case CR: |
| r->header_end = p - 1; |
| state = sw_almost_done; |
| break; |
| case LF: |
| r->header_end = p - 1; |
| state = sw_done; |
| break; |
| } |
| break; |
| |
| /* space* before end of header line */ |
| case sw_space_after_value: |
| switch (ch) { |
| case ' ': |
| break; |
| case CR: |
| state = sw_almost_done; |
| break; |
| case LF: |
| state = sw_done; |
| break; |
| default: |
| state = sw_value; |
| break; |
| } |
| break; |
| |
| /* ignore header line */ |
| case sw_ignore_line: |
| switch (ch) { |
| case LF: |
| state = sw_start; |
| break; |
| default: |
| break; |
| } |
| break; |
| |
| /* end of header line */ |
| case sw_almost_done: |
| switch (ch) { |
| case LF: |
| state = sw_done; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_HEADER; |
| } |
| break; |
| |
| /* end of header */ |
| case sw_header_almost_done: |
| switch (ch) { |
| case LF: |
| state = sw_header_done; |
| break; |
| default: |
| return NGX_HTTP_PARSE_INVALID_HEADER; |
| } |
| break; |
| |
| /* suppress warning */ |
| case sw_done: |
| case sw_header_done: |
| break; |
| } |
| } |
| |
| b->pos = p; |
| |
| if (state == sw_done) { |
| r->state = sw_start; |
| return NGX_OK; |
| |
| } else if (state == sw_header_done) { |
| r->state = sw_start; |
| return NGX_HTTP_PARSE_HEADER_DONE; |
| |
| } else { |
| r->state = state; |
| return NGX_AGAIN; |
| } |
| } |
| |
| |
| ngx_int_t ngx_http_parse_complex_uri(ngx_http_request_t *r) |
| { |
| u_char c, ch, decoded, *p, *u; |
| enum { |
| sw_usual = 0, |
| sw_slash, |
| sw_dot, |
| sw_dot_dot, |
| #if (NGX_WIN32) |
| sw_dot_dot_dot, |
| #endif |
| sw_quoted, |
| sw_quoted_second |
| } state, quoted_state; |
| |
| decoded = '\0'; |
| quoted_state = sw_usual; |
| |
| state = sw_usual; |
| p = r->uri_start; |
| u = r->uri.data; |
| r->uri_ext = NULL; |
| r->args_start = NULL; |
| |
| ch = *p++; |
| |
| while (p < r->uri_start + r->uri.len + 1 && r->args_start == NULL) { |
| |
| /* |
| * we use "ch = *p++" inside the cycle but this operation is safe |
| * because after the URI there is always at least one charcter: |
| * the line feed |
| */ |
| |
| ngx_log_debug4(NGX_LOG_DEBUG_HTTP, r->connection->log, 0, |
| "s:%d in:'%Xd:%c', out:'%c'", state, ch, ch, *u); |
| |
| switch (state) { |
| case sw_usual: |
| switch(ch) { |
| #if (NGX_WIN32) |
| case '\\': |
| r->uri_ext = NULL; |
| |
| if (p == r->uri_start + r->uri.len) { |
| |
| /* |
| * we omit the last "\" to cause redirect because |
| * the browsers do not treat "\" as "/" in relative URL path |
| */ |
| |
| break; |
| } |
| |
| state = sw_slash; |
| *u++ = '/'; |
| break; |
| #endif |
| case '/': |
| r->uri_ext = NULL; |
| state = sw_slash; |
| *u++ = ch; |
| break; |
| case '%': |
| quoted_state = state; |
| state = sw_quoted; |
| break; |
| case '?': |
| r->args_start = p; |
| break; |
| case '.': |
| r->uri_ext = u + 1; |
| default: |
| *u++ = ch; |
| break; |
| } |
| ch = *p++; |
| break; |
| |
| case sw_slash: |
| switch(ch) { |
| #if (NGX_WIN32) |
| case '\\': |
| break; |
| #endif |
| case '/': |
| break; |
| case '.': |
| state = sw_dot; |
| *u++ = ch; |
| break; |
| case '%': |
| quoted_state = state; |
| state = sw_quoted; |
| break; |
| default: |
| state = sw_usual; |
| *u++ = ch; |
| break; |
| } |
| ch = *p++; |
| break; |
| |
| case sw_dot: |
| switch(ch) { |
| #if (NGX_WIN32) |
| case '\\': |
| /* fall through */ |
| #endif |
| case '/': |
| state = sw_slash; |
| u--; |
| break; |
| case '.': |
| state = sw_dot_dot; |
| *u++ = ch; |
| break; |
| case '%': |
| quoted_state = state; |
| state = sw_quoted; |
| break; |
| default: |
| state = sw_usual; |
| *u++ = ch; |
| break; |
| } |
| ch = *p++; |
| break; |
| |
| case sw_dot_dot: |
| switch(ch) { |
| #if (NGX_WIN32) |
| case '\\': |
| /* fall through */ |
| #endif |
| case '/': |
| state = sw_slash; |
| u -= 4; |
| if (u < r->uri.data) { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| while (*(u - 1) != '/') { |
| u--; |
| } |
| break; |
| case '%': |
| quoted_state = state; |
| state = sw_quoted; |
| break; |
| #if (NGX_WIN32) |
| case '.': |
| state = sw_dot_dot_dot; |
| *u++ = ch; |
| break; |
| #endif |
| default: |
| state = sw_usual; |
| *u++ = ch; |
| break; |
| } |
| ch = *p++; |
| break; |
| |
| #if (NGX_WIN32) |
| case sw_dot_dot_dot: |
| switch(ch) { |
| case '\\': |
| case '/': |
| state = sw_slash; |
| u -= 5; |
| if (u < r->uri.data) { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| while (*u != '/') { |
| u--; |
| } |
| if (u < r->uri.data) { |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| while (*(u - 1) != '/') { |
| u--; |
| } |
| break; |
| case '%': |
| quoted_state = state; |
| state = sw_quoted; |
| break; |
| default: |
| state = sw_usual; |
| *u++ = ch; |
| break; |
| } |
| ch = *p++; |
| break; |
| #endif |
| |
| case sw_quoted: |
| if (ch >= '0' && ch <= '9') { |
| decoded = (u_char) (ch - '0'); |
| state = sw_quoted_second; |
| ch = *p++; |
| break; |
| } |
| |
| c = (u_char) (ch | 0x20); |
| if (c >= 'a' && c <= 'f') { |
| decoded = (u_char) (c - 'a' + 10); |
| state = sw_quoted_second; |
| ch = *p++; |
| break; |
| } |
| |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| |
| case sw_quoted_second: |
| if (ch >= '0' && ch <= '9') { |
| ch = (u_char) ((decoded << 4) + ch - '0'); |
| if (ch == '%') { |
| state = sw_usual; |
| *u++ = ch; |
| ch = *p++; |
| break; |
| } |
| state = quoted_state; |
| break; |
| } |
| |
| c = (u_char) (ch | 0x20); |
| if (c >= 'a' && c <= 'f') { |
| ch = (u_char) ((decoded << 4) + c - 'a' + 10); |
| if (ch == '%') { |
| state = sw_usual; |
| *u++ = ch; |
| ch = *p++; |
| break; |
| } |
| state = quoted_state; |
| break; |
| } |
| |
| return NGX_HTTP_PARSE_INVALID_REQUEST; |
| } |
| } |
| |
| r->uri.len = u - r->uri.data; |
| r->uri.data[r->uri.len] = '\0'; |
| |
| if (r->uri_ext) { |
| r->exten.len = u - r->uri_ext; |
| r->exten.data = r->uri_ext; |
| } |
| |
| r->uri_ext = NULL; |
| |
| return NGX_OK; |
| } |