blob: ddd8d77e6907641bcbaa6ee5420c4aa226a047fc [file] [log] [blame]
Igor Sysoev0c331d92002-08-15 17:20:26 +00001
Igor Sysoevd90282d2004-09-28 08:34:51 +00002/*
Igor Sysoevff8da912004-09-29 16:00:49 +00003 * Copyright (C) Igor Sysoev
Igor Sysoevd90282d2004-09-28 08:34:51 +00004 */
5
6
Igor Sysoev0c331d92002-08-15 17:20:26 +00007#include <ngx_config.h>
Igor Sysoev016b8522002-08-29 16:59:54 +00008#include <ngx_core.h>
Igor Sysoev0c331d92002-08-15 17:20:26 +00009#include <ngx_http.h>
10
Igor Sysoev59cf56c2004-09-07 15:29:22 +000011
Igor Sysoev3338cfd2006-05-11 14:43:47 +000012/* gcc, icc, msvc and others compile these switches as an jump table */
13
Igor Sysoev899b44e2005-05-12 14:58:06 +000014ngx_int_t
15ngx_http_parse_request_line(ngx_http_request_t *r, ngx_buf_t *b)
Igor Sysoev0c331d92002-08-15 17:20:26 +000016{
Igor Sysoev02f742b2005-04-08 15:18:55 +000017 u_char c, ch, *p, *m;
Igor Sysoev0c331d92002-08-15 17:20:26 +000018 enum {
Igor Sysoev016b8522002-08-29 16:59:54 +000019 sw_start = 0,
Igor Sysoeva3677242004-04-14 05:57:36 +000020 sw_method,
Igor Sysoev016b8522002-08-29 16:59:54 +000021 sw_space_after_method,
22 sw_spaces_before_uri,
Igor Sysoeva3677242004-04-14 05:57:36 +000023 sw_schema,
24 sw_schema_slash,
25 sw_schema_slash_slash,
26 sw_host,
27 sw_port,
Igor Sysoev016b8522002-08-29 16:59:54 +000028 sw_after_slash_in_uri,
29 sw_check_uri,
30 sw_uri,
31 sw_http_09,
Igor Sysoeva9830112003-05-19 16:39:14 +000032 sw_http_H,
33 sw_http_HT,
34 sw_http_HTT,
35 sw_http_HTTP,
Igor Sysoev016b8522002-08-29 16:59:54 +000036 sw_first_major_digit,
37 sw_major_digit,
38 sw_first_minor_digit,
39 sw_minor_digit,
Igor Sysoev02025fd2005-01-18 13:03:58 +000040 sw_almost_done
Igor Sysoev481b6432002-12-04 16:29:40 +000041 } state;
42
43 state = r->state;
Igor Sysoev0c331d92002-08-15 17:20:26 +000044
Igor Sysoev02025fd2005-01-18 13:03:58 +000045 for (p = b->pos; p < b->last; p++) {
46 ch = *p;
Igor Sysoev0c331d92002-08-15 17:20:26 +000047
Igor Sysoev0c331d92002-08-15 17:20:26 +000048 switch (state) {
49
50 /* HTTP methods: GET, HEAD, POST */
Igor Sysoev016b8522002-08-29 16:59:54 +000051 case sw_start:
Igor Sysoev02025fd2005-01-18 13:03:58 +000052 r->request_start = p;
Igor Sysoev3d062ad2003-03-05 06:37:42 +000053
Igor Sysoev732a2712004-04-21 18:54:33 +000054 if (ch == CR || ch == LF) {
55 break;
56 }
57
Igor Sysoeva3677242004-04-14 05:57:36 +000058 if (ch < 'A' || ch > 'Z') {
Igor Sysoev1af7c822002-09-13 14:47:42 +000059 return NGX_HTTP_PARSE_INVALID_METHOD;
Igor Sysoev0c331d92002-08-15 17:20:26 +000060 }
Igor Sysoeva3677242004-04-14 05:57:36 +000061
62 state = sw_method;
Igor Sysoeva9830112003-05-19 16:39:14 +000063 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +000064
Igor Sysoeva3677242004-04-14 05:57:36 +000065 case sw_method:
66 if (ch == ' ') {
Igor Sysoev899b44e2005-05-12 14:58:06 +000067 r->method_end = p - 1;
Igor Sysoeva3677242004-04-14 05:57:36 +000068 m = r->request_start;
Igor Sysoeva9830112003-05-19 16:39:14 +000069
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000070 switch (p - m) {
Igor Sysoeva9830112003-05-19 16:39:14 +000071
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000072 case 3:
Igor Sysoev2e6ba932004-09-09 15:40:48 +000073 if (m[0] == 'G' && m[1] == 'E' && m[2] == 'T') {
Igor Sysoeva3677242004-04-14 05:57:36 +000074 r->method = NGX_HTTP_GET;
Igor Sysoev8a2b2fb2006-04-14 09:53:38 +000075
76 } else if (m[0] == 'P' && m[1] == 'U' && m[2] == 'T') {
77 r->method = NGX_HTTP_PUT;
Igor Sysoeva3677242004-04-14 05:57:36 +000078 }
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000079 break;
Igor Sysoeva9830112003-05-19 16:39:14 +000080
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000081 case 4:
Igor Sysoev2e6ba932004-09-09 15:40:48 +000082 if (m[0] == 'P' && m[1] == 'O'
Igor Sysoev02025fd2005-01-18 13:03:58 +000083 && m[2] == 'S' && m[3] == 'T')
Igor Sysoeva3677242004-04-14 05:57:36 +000084 {
85 r->method = NGX_HTTP_POST;
Igor Sysoeva9830112003-05-19 16:39:14 +000086
Igor Sysoev2e6ba932004-09-09 15:40:48 +000087 } else if (m[0] == 'H' && m[1] == 'E'
88 && m[2] == 'A' && m[3] == 'D')
Igor Sysoeva3677242004-04-14 05:57:36 +000089 {
90 r->method = NGX_HTTP_HEAD;
91 }
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000092 break;
Igor Sysoev8a2b2fb2006-04-14 09:53:38 +000093
Igor Sysoev4ecb4d72006-04-21 12:06:44 +000094 case 5:
Igor Sysoev7bdb7202006-04-19 15:30:56 +000095 if (m[0] == 'M' && m[1] == 'K'
96 && m[2] == 'C' && m[3] == 'O' && m[4] == 'L')
97 {
98 r->method = NGX_HTTP_MKCOL;
99 }
Igor Sysoev4ecb4d72006-04-21 12:06:44 +0000100 break;
Igor Sysoev7bdb7202006-04-19 15:30:56 +0000101
Igor Sysoev4ecb4d72006-04-21 12:06:44 +0000102 case 6:
Igor Sysoev8a2b2fb2006-04-14 09:53:38 +0000103 if (m[0] == 'D' && m[1] == 'E' && m[2] == 'L'
104 && m[3] == 'E' && m[4] == 'T' && m[5] == 'E')
105 {
106 r->method = NGX_HTTP_DELETE;
107 }
Igor Sysoev4ecb4d72006-04-21 12:06:44 +0000108 break;
Igor Sysoeva3677242004-04-14 05:57:36 +0000109 }
Igor Sysoeva9830112003-05-19 16:39:14 +0000110
Igor Sysoeva3677242004-04-14 05:57:36 +0000111 state = sw_spaces_before_uri;
Igor Sysoeva9830112003-05-19 16:39:14 +0000112 break;
Igor Sysoeva9830112003-05-19 16:39:14 +0000113 }
Igor Sysoeva9830112003-05-19 16:39:14 +0000114
Igor Sysoeva3677242004-04-14 05:57:36 +0000115 if (ch < 'A' || ch > 'Z') {
Igor Sysoeva9830112003-05-19 16:39:14 +0000116 return NGX_HTTP_PARSE_INVALID_METHOD;
117 }
Igor Sysoeva3677242004-04-14 05:57:36 +0000118
Igor Sysoev0c331d92002-08-15 17:20:26 +0000119 break;
120
121 /* single space after method */
Igor Sysoev016b8522002-08-29 16:59:54 +0000122 case sw_space_after_method:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000123 switch (ch) {
124 case ' ':
Igor Sysoev016b8522002-08-29 16:59:54 +0000125 state = sw_spaces_before_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000126 break;
127 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000128 return NGX_HTTP_PARSE_INVALID_METHOD;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000129 }
130 break;
131
132 /* space* before URI */
Igor Sysoev016b8522002-08-29 16:59:54 +0000133 case sw_spaces_before_uri:
Igor Sysoev02f742b2005-04-08 15:18:55 +0000134
135 c = (u_char) (ch | 0x20);
Igor Sysoev7b190b42005-06-07 15:56:31 +0000136 if (c >= 'a' && c <= 'z') {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000137 r->schema_start = p;
138 state = sw_schema;
139 break;
140 }
141
Igor Sysoev0c331d92002-08-15 17:20:26 +0000142 switch (ch) {
143 case '/':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000144 r->uri_start = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000145 state = sw_after_slash_in_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000146 break;
147 case ' ':
148 break;
149 default:
Igor Sysoeva3677242004-04-14 05:57:36 +0000150 return NGX_HTTP_PARSE_INVALID_REQUEST;
151 }
152 break;
153
154 case sw_schema:
Igor Sysoev02f742b2005-04-08 15:18:55 +0000155
156 c = (u_char) (ch | 0x20);
Igor Sysoev7b190b42005-06-07 15:56:31 +0000157 if (c >= 'a' && c <= 'z') {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000158 break;
159 }
160
Igor Sysoeva3677242004-04-14 05:57:36 +0000161 switch (ch) {
162 case ':':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000163 r->schema_end = p;
Igor Sysoeva3677242004-04-14 05:57:36 +0000164 state = sw_schema_slash;
165 break;
166 default:
Igor Sysoeva3677242004-04-14 05:57:36 +0000167 return NGX_HTTP_PARSE_INVALID_REQUEST;
168 }
169 break;
170
171 case sw_schema_slash:
172 switch (ch) {
173 case '/':
174 state = sw_schema_slash_slash;
175 break;
176 default:
177 return NGX_HTTP_PARSE_INVALID_REQUEST;
178 }
179 break;
180
181 case sw_schema_slash_slash:
182 switch (ch) {
183 case '/':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000184 r->host_start = p;
Igor Sysoeva3677242004-04-14 05:57:36 +0000185 state = sw_host;
186 break;
187 default:
188 return NGX_HTTP_PARSE_INVALID_REQUEST;
189 }
190 break;
191
192 case sw_host:
Igor Sysoev02f742b2005-04-08 15:18:55 +0000193
194 c = (u_char) (ch | 0x20);
Igor Sysoev7b190b42005-06-07 15:56:31 +0000195 if (c >= 'a' && c <= 'z') {
Igor Sysoev02f742b2005-04-08 15:18:55 +0000196 break;
197 }
198
199 if ((ch >= '0' && ch <= '9') || ch == '.' || ch == '-')
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000200 {
201 break;
202 }
203
Igor Sysoeva3677242004-04-14 05:57:36 +0000204 switch (ch) {
205 case ':':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000206 r->host_end = p;
Igor Sysoeva3677242004-04-14 05:57:36 +0000207 state = sw_port;
208 break;
209 case '/':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000210 r->host_end = p;
211 r->uri_start = p;
Igor Sysoeva3677242004-04-14 05:57:36 +0000212 state = sw_after_slash_in_uri;
213 break;
214 default:
Igor Sysoeva3677242004-04-14 05:57:36 +0000215 return NGX_HTTP_PARSE_INVALID_REQUEST;
216 }
217 break;
218
219 case sw_port:
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000220 if (ch >= '0' && ch <= '9') {
221 break;
222 }
223
Igor Sysoeva3677242004-04-14 05:57:36 +0000224 switch (ch) {
225 case '/':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000226 r->port_end = p;
227 r->uri_start = p;
Igor Sysoeva3677242004-04-14 05:57:36 +0000228 state = sw_after_slash_in_uri;
229 break;
230 default:
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000231 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000232 }
233 break;
234
Igor Sysoev1b735832004-11-11 14:07:14 +0000235 /* check "/.", "//", "%", and "\" (Win32) in URI */
Igor Sysoev016b8522002-08-29 16:59:54 +0000236 case sw_after_slash_in_uri:
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000237
Igor Sysoev02f742b2005-04-08 15:18:55 +0000238 c = (u_char) (ch | 0x20);
Igor Sysoev7b190b42005-06-07 15:56:31 +0000239 if (c >= 'a' && c <= 'z') {
Igor Sysoev02f742b2005-04-08 15:18:55 +0000240 state = sw_check_uri;
241 break;
242 }
243
244 if (ch >= '0' && ch <= '9') {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000245 state = sw_check_uri;
246 break;
247 }
248
Igor Sysoev0c331d92002-08-15 17:20:26 +0000249 switch (ch) {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000250 case ' ':
251 r->uri_end = p;
252 state = sw_http_09;
253 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000254 case CR:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000255 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000256 r->http_minor = 9;
Igor Sysoev016b8522002-08-29 16:59:54 +0000257 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000258 break;
259 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000260 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000261 r->http_minor = 9;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000262 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000263 case '.':
264 r->complex_uri = 1;
Igor Sysoev016b8522002-08-29 16:59:54 +0000265 state = sw_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000266 break;
Igor Sysoev924bd792004-10-11 15:07:03 +0000267 case '%':
268 r->quoted_uri = 1;
269 state = sw_uri;
270 break;
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000271 case '/':
272 r->complex_uri = 1;
273 state = sw_uri;
274 break;
Igor Sysoev1b735832004-11-11 14:07:14 +0000275#if (NGX_WIN32)
276 case '\\':
277 r->complex_uri = 1;
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000278 state = sw_uri;
Igor Sysoev1b735832004-11-11 14:07:14 +0000279 break;
280#endif
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000281 case '?':
282 r->args_start = p + 1;
283 state = sw_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000284 break;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000285 case '#':
286 r->complex_uri = 1;
287 state = sw_uri;
288 break;
Igor Sysoev805d9db2005-02-03 19:33:37 +0000289 case '+':
290 r->plus_in_uri = 1;
291 break;
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000292 case '\0':
293 r->zero_in_uri = 1;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000294 break;
295 default:
Igor Sysoev016b8522002-08-29 16:59:54 +0000296 state = sw_check_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000297 break;
298 }
299 break;
300
Igor Sysoev1b735832004-11-11 14:07:14 +0000301 /* check "/", "%" and "\" (Win32) in URI */
Igor Sysoev016b8522002-08-29 16:59:54 +0000302 case sw_check_uri:
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000303
Igor Sysoev02f742b2005-04-08 15:18:55 +0000304 c = (u_char) (ch | 0x20);
Igor Sysoev7b190b42005-06-07 15:56:31 +0000305 if (c >= 'a' && c <= 'z') {
Igor Sysoev02f742b2005-04-08 15:18:55 +0000306 break;
307 }
308
309 if (ch >= '0' && ch <= '9') {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000310 break;
311 }
312
Igor Sysoev0c331d92002-08-15 17:20:26 +0000313 switch (ch) {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000314 case '/':
315 r->uri_ext = NULL;
316 state = sw_after_slash_in_uri;
317 break;
318 case '.':
319 r->uri_ext = p + 1;
320 break;
321 case ' ':
322 r->uri_end = p;
323 state = sw_http_09;
324 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000325 case CR:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000326 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000327 r->http_minor = 9;
Igor Sysoev016b8522002-08-29 16:59:54 +0000328 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000329 break;
330 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000331 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000332 r->http_minor = 9;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000333 goto done;
Igor Sysoev1b735832004-11-11 14:07:14 +0000334#if (NGX_WIN32)
335 case '\\':
336 r->complex_uri = 1;
337 state = sw_after_slash_in_uri;
338 break;
339#endif
Igor Sysoev7578ec92003-06-02 15:24:30 +0000340 case '%':
Igor Sysoev924bd792004-10-11 15:07:03 +0000341 r->quoted_uri = 1;
Igor Sysoev7578ec92003-06-02 15:24:30 +0000342 state = sw_uri;
343 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000344 case '?':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000345 r->args_start = p + 1;
Igor Sysoev016b8522002-08-29 16:59:54 +0000346 state = sw_uri;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000347 break;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000348 case '#':
349 r->complex_uri = 1;
350 state = sw_uri;
351 break;
Igor Sysoevef809b82006-06-28 16:00:26 +0000352 case '+':
353 r->plus_in_uri = 1;
354 break;
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000355 case '\0':
356 r->zero_in_uri = 1;
357 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000358 }
359 break;
360
361 /* URI */
Igor Sysoev016b8522002-08-29 16:59:54 +0000362 case sw_uri:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000363 switch (ch) {
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000364 case ' ':
365 r->uri_end = p;
366 state = sw_http_09;
367 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000368 case CR:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000369 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000370 r->http_minor = 9;
Igor Sysoev016b8522002-08-29 16:59:54 +0000371 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000372 break;
373 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000374 r->uri_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000375 r->http_minor = 9;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000376 goto done;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000377 case '#':
378 r->complex_uri = 1;
379 break;
Igor Sysoev1ebfead2005-02-16 13:40:36 +0000380 case '\0':
381 r->zero_in_uri = 1;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000382 break;
383 }
384 break;
385
386 /* space+ after URI */
Igor Sysoev016b8522002-08-29 16:59:54 +0000387 case sw_http_09:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000388 switch (ch) {
389 case ' ':
390 break;
391 case CR:
392 r->http_minor = 9;
Igor Sysoev016b8522002-08-29 16:59:54 +0000393 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000394 break;
395 case LF:
396 r->http_minor = 9;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000397 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000398 case 'H':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000399 r->http_protocol.data = p;
Igor Sysoeva9830112003-05-19 16:39:14 +0000400 state = sw_http_H;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000401 break;
402 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000403 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000404 }
405 break;
406
Igor Sysoeva9830112003-05-19 16:39:14 +0000407 case sw_http_H:
408 switch (ch) {
409 case 'T':
410 state = sw_http_HT;
411 break;
412 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000413 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000414 }
Igor Sysoeva9830112003-05-19 16:39:14 +0000415 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000416
Igor Sysoeva9830112003-05-19 16:39:14 +0000417 case sw_http_HT:
418 switch (ch) {
419 case 'T':
420 state = sw_http_HTT;
421 break;
422 default:
423 return NGX_HTTP_PARSE_INVALID_REQUEST;
424 }
425 break;
426
427 case sw_http_HTT:
428 switch (ch) {
429 case 'P':
430 state = sw_http_HTTP;
431 break;
432 default:
433 return NGX_HTTP_PARSE_INVALID_REQUEST;
434 }
435 break;
436
437 case sw_http_HTTP:
438 switch (ch) {
439 case '/':
440 state = sw_first_major_digit;
441 break;
442 default:
443 return NGX_HTTP_PARSE_INVALID_REQUEST;
444 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000445 break;
446
447 /* first digit of major HTTP version */
Igor Sysoev016b8522002-08-29 16:59:54 +0000448 case sw_first_major_digit:
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000449 if (ch < '1' || ch > '9') {
Igor Sysoev1af7c822002-09-13 14:47:42 +0000450 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000451 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000452
453 r->http_major = ch - '0';
Igor Sysoev016b8522002-08-29 16:59:54 +0000454 state = sw_major_digit;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000455 break;
456
457 /* major HTTP version or dot */
Igor Sysoev016b8522002-08-29 16:59:54 +0000458 case sw_major_digit:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000459 if (ch == '.') {
Igor Sysoev016b8522002-08-29 16:59:54 +0000460 state = sw_first_minor_digit;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000461 break;
462 }
463
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000464 if (ch < '0' || ch > '9') {
Igor Sysoev1af7c822002-09-13 14:47:42 +0000465 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000466 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000467
468 r->http_major = r->http_major * 10 + ch - '0';
469 break;
470
471 /* first digit of minor HTTP version */
Igor Sysoev016b8522002-08-29 16:59:54 +0000472 case sw_first_minor_digit:
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000473 if (ch < '0' || ch > '9') {
Igor Sysoev1af7c822002-09-13 14:47:42 +0000474 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000475 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000476
477 r->http_minor = ch - '0';
Igor Sysoev016b8522002-08-29 16:59:54 +0000478 state = sw_minor_digit;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000479 break;
480
481 /* minor HTTP version or end of request line */
Igor Sysoev016b8522002-08-29 16:59:54 +0000482 case sw_minor_digit:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000483 if (ch == CR) {
Igor Sysoev016b8522002-08-29 16:59:54 +0000484 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000485 break;
486 }
487
488 if (ch == LF) {
Igor Sysoev02025fd2005-01-18 13:03:58 +0000489 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000490 }
491
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000492 if (ch < '0' || ch > '9') {
Igor Sysoev1af7c822002-09-13 14:47:42 +0000493 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000494 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000495
496 r->http_minor = r->http_minor * 10 + ch - '0';
497 break;
498
499 /* end of request line */
Igor Sysoev016b8522002-08-29 16:59:54 +0000500 case sw_almost_done:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000501 r->request_end = p - 1;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000502 switch (ch) {
503 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000504 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000505 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000506 return NGX_HTTP_PARSE_INVALID_REQUEST;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000507 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000508 }
509 }
510
Igor Sysoevdd888c42004-09-21 05:38:28 +0000511 b->pos = p;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000512 r->state = state;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000513
Igor Sysoev02025fd2005-01-18 13:03:58 +0000514 return NGX_AGAIN;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000515
Igor Sysoev02025fd2005-01-18 13:03:58 +0000516done:
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000517
Igor Sysoev02025fd2005-01-18 13:03:58 +0000518 b->pos = p + 1;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000519
Igor Sysoev02025fd2005-01-18 13:03:58 +0000520 if (r->request_end == NULL) {
521 r->request_end = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000522 }
Igor Sysoev02025fd2005-01-18 13:03:58 +0000523
524 r->http_version = r->http_major * 1000 + r->http_minor;
525 r->state = sw_start;
526
527 if (r->http_version == 9 && r->method != NGX_HTTP_GET) {
528 return NGX_HTTP_PARSE_INVALID_09_METHOD;
529 }
530
531 return NGX_OK;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000532}
533
Igor Sysoevc2bba092003-11-28 17:41:47 +0000534
Igor Sysoev899b44e2005-05-12 14:58:06 +0000535ngx_int_t
536ngx_http_parse_header_line(ngx_http_request_t *r, ngx_buf_t *b)
Igor Sysoev0c331d92002-08-15 17:20:26 +0000537{
Igor Sysoev02f742b2005-04-08 15:18:55 +0000538 u_char c, ch, *p;
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000539 ngx_uint_t hash, i;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000540 enum {
Igor Sysoev016b8522002-08-29 16:59:54 +0000541 sw_start = 0,
542 sw_name,
543 sw_space_before_value,
544 sw_value,
545 sw_space_after_value,
Igor Sysoev4d656dc2005-03-22 16:02:46 +0000546 sw_ignore_line,
Igor Sysoev016b8522002-08-29 16:59:54 +0000547 sw_almost_done,
Igor Sysoev4d656dc2005-03-22 16:02:46 +0000548 sw_header_almost_done
Igor Sysoev481b6432002-12-04 16:29:40 +0000549 } state;
550
Igor Sysoevbb8bbb72006-10-17 12:47:14 +0000551 /* the last '\0' is not needed because string is zero terminated */
552
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000553 static u_char lowcase[] =
554 "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0"
555 "\0\0\0\0\0\0\0\0\0\0\0\0\0-\0\0" "0123456789\0\0\0\0\0\0"
556 "\0abcdefghijklmnopqrstuvwxyz\0\0\0\0\0"
557 "\0abcdefghijklmnopqrstuvwxyz\0\0\0\0\0"
558 "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0"
559 "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0"
560 "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0"
Igor Sysoevbb8bbb72006-10-17 12:47:14 +0000561 "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0";
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000562
Igor Sysoev481b6432002-12-04 16:29:40 +0000563 state = r->state;
Igor Sysoev02f742b2005-04-08 15:18:55 +0000564 hash = r->header_hash;
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000565 i = r->lowcase_index;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000566
Igor Sysoev02025fd2005-01-18 13:03:58 +0000567 for (p = b->pos; p < b->last; p++) {
568 ch = *p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000569
Igor Sysoev0c331d92002-08-15 17:20:26 +0000570 switch (state) {
571
572 /* first char */
Igor Sysoev016b8522002-08-29 16:59:54 +0000573 case sw_start:
Igor Sysoev3362b8d2005-05-14 18:42:03 +0000574 r->invalid_header = 0;
575
Igor Sysoev0c331d92002-08-15 17:20:26 +0000576 switch (ch) {
577 case CR:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000578 r->header_end = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000579 state = sw_header_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000580 break;
581 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000582 r->header_end = p;
583 goto header_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000584 default:
Igor Sysoev016b8522002-08-29 16:59:54 +0000585 state = sw_name;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000586 r->header_name_start = p;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000587
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000588 c = lowcase[ch];
Igor Sysoev0c331d92002-08-15 17:20:26 +0000589
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000590 if (c) {
591 hash = ngx_hash(0, c);
592 r->lowcase_header[0] = c;
593 i = 1;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000594 break;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000595 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000596
Igor Sysoev3362b8d2005-05-14 18:42:03 +0000597 r->invalid_header = 1;
598
Igor Sysoev4d656dc2005-03-22 16:02:46 +0000599 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000600
601 }
602 break;
603
604 /* header name */
Igor Sysoev016b8522002-08-29 16:59:54 +0000605 case sw_name:
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000606 c = lowcase[ch];
607
608 if (c) {
609 hash = ngx_hash(hash, c);
610 r->lowcase_header[i++] = c;
611 i &= ~NGX_HTTP_LC_HEADER_LEN;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000612 break;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000613 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000614
615 if (ch == ':') {
Igor Sysoev02025fd2005-01-18 13:03:58 +0000616 r->header_name_end = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000617 state = sw_space_before_value;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000618 break;
619 }
620
Igor Sysoev899b44e2005-05-12 14:58:06 +0000621 if (ch == CR) {
622 r->header_name_end = p;
623 r->header_start = p;
624 r->header_end = p;
625 state = sw_almost_done;
626 break;
627 }
628
629 if (ch == LF) {
630 r->header_name_end = p;
631 r->header_start = p;
632 r->header_end = p;
633 goto done;
634 }
635
Igor Sysoev924bd792004-10-11 15:07:03 +0000636 /* IIS may send the duplicate "HTTP/1.1 ..." lines */
Igor Sysoev183f9a62003-04-09 15:42:08 +0000637 if (ch == '/'
Igor Sysoev899b44e2005-05-12 14:58:06 +0000638 && r->upstream
639 && p - r->header_name_start == 4
640 && ngx_strncmp(r->header_name_start, "HTTP", 4) == 0)
Igor Sysoev183f9a62003-04-09 15:42:08 +0000641 {
642 state = sw_ignore_line;
643 break;
Igor Sysoeve2a31542003-04-08 15:40:10 +0000644 }
645
Igor Sysoev3362b8d2005-05-14 18:42:03 +0000646 r->invalid_header = 1;
647
Igor Sysoev4d656dc2005-03-22 16:02:46 +0000648 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000649
650 /* space* before header value */
Igor Sysoev016b8522002-08-29 16:59:54 +0000651 case sw_space_before_value:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000652 switch (ch) {
653 case ' ':
654 break;
655 case CR:
Igor Sysoev899b44e2005-05-12 14:58:06 +0000656 r->header_start = p;
657 r->header_end = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000658 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000659 break;
660 case LF:
Igor Sysoev899b44e2005-05-12 14:58:06 +0000661 r->header_start = p;
662 r->header_end = p;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000663 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000664 default:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000665 r->header_start = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000666 state = sw_value;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000667 break;
668 }
669 break;
670
671 /* header value */
Igor Sysoev016b8522002-08-29 16:59:54 +0000672 case sw_value:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000673 switch (ch) {
674 case ' ':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000675 r->header_end = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000676 state = sw_space_after_value;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000677 break;
678 case CR:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000679 r->header_end = p;
Igor Sysoev016b8522002-08-29 16:59:54 +0000680 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000681 break;
682 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000683 r->header_end = p;
684 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000685 }
686 break;
687
688 /* space* before end of header line */
Igor Sysoev016b8522002-08-29 16:59:54 +0000689 case sw_space_after_value:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000690 switch (ch) {
691 case ' ':
692 break;
693 case CR:
Igor Sysoev016b8522002-08-29 16:59:54 +0000694 state = sw_almost_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000695 break;
696 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000697 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000698 default:
Igor Sysoev016b8522002-08-29 16:59:54 +0000699 state = sw_value;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000700 break;
701 }
702 break;
703
Igor Sysoeve2a31542003-04-08 15:40:10 +0000704 /* ignore header line */
705 case sw_ignore_line:
706 switch (ch) {
707 case LF:
708 state = sw_start;
709 break;
710 default:
711 break;
712 }
713 break;
714
Igor Sysoev0c331d92002-08-15 17:20:26 +0000715 /* end of header line */
Igor Sysoev016b8522002-08-29 16:59:54 +0000716 case sw_almost_done:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000717 switch (ch) {
Igor Sysoev8fea8852006-03-15 09:53:04 +0000718 case CR:
719 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000720 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000721 goto done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000722 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000723 return NGX_HTTP_PARSE_INVALID_HEADER;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000724 }
Igor Sysoev455a7fc2006-03-21 08:20:41 +0000725 break;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000726
727 /* end of header */
Igor Sysoev016b8522002-08-29 16:59:54 +0000728 case sw_header_almost_done:
Igor Sysoev0c331d92002-08-15 17:20:26 +0000729 switch (ch) {
730 case LF:
Igor Sysoev02025fd2005-01-18 13:03:58 +0000731 goto header_done;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000732 default:
Igor Sysoev1af7c822002-09-13 14:47:42 +0000733 return NGX_HTTP_PARSE_INVALID_HEADER;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000734 }
Igor Sysoev0c331d92002-08-15 17:20:26 +0000735 }
736 }
737
Igor Sysoev369145c2004-05-28 15:49:23 +0000738 b->pos = p;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000739 r->state = state;
Igor Sysoev02f742b2005-04-08 15:18:55 +0000740 r->header_hash = hash;
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000741 r->lowcase_index = i;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000742
Igor Sysoev02025fd2005-01-18 13:03:58 +0000743 return NGX_AGAIN;
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000744
Igor Sysoev02025fd2005-01-18 13:03:58 +0000745done:
Igor Sysoev4e9393a2003-01-09 05:36:00 +0000746
Igor Sysoev02025fd2005-01-18 13:03:58 +0000747 b->pos = p + 1;
748 r->state = sw_start;
Igor Sysoev02f742b2005-04-08 15:18:55 +0000749 r->header_hash = hash;
Igor Sysoev3338cfd2006-05-11 14:43:47 +0000750 r->lowcase_index = i;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000751
752 return NGX_OK;
753
754header_done:
755
756 b->pos = p + 1;
757 r->state = sw_start;
758
759 return NGX_HTTP_PARSE_HEADER_DONE;
Igor Sysoev0c331d92002-08-15 17:20:26 +0000760}
Igor Sysoevc2bba092003-11-28 17:41:47 +0000761
762
Igor Sysoev899b44e2005-05-12 14:58:06 +0000763ngx_int_t
764ngx_http_parse_complex_uri(ngx_http_request_t *r)
Igor Sysoevc2bba092003-11-28 17:41:47 +0000765{
Igor Sysoev10a543a2004-03-16 07:10:12 +0000766 u_char c, ch, decoded, *p, *u;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000767 enum {
768 sw_usual = 0,
769 sw_slash,
770 sw_dot,
771 sw_dot_dot,
Igor Sysoev1b735832004-11-11 14:07:14 +0000772#if (NGX_WIN32)
Igor Sysoevc2bba092003-11-28 17:41:47 +0000773 sw_dot_dot_dot,
774#endif
775 sw_quoted,
776 sw_quoted_second
777 } state, quoted_state;
778
Igor Sysoev02025fd2005-01-18 13:03:58 +0000779#if (NGX_SUPPRESS_WARN)
Igor Sysoevc2bba092003-11-28 17:41:47 +0000780 decoded = '\0';
781 quoted_state = sw_usual;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000782#endif
Igor Sysoevc2bba092003-11-28 17:41:47 +0000783
784 state = sw_usual;
785 p = r->uri_start;
786 u = r->uri.data;
Igor Sysoev865c1502003-11-30 20:03:18 +0000787 r->uri_ext = NULL;
Igor Sysoev1b735832004-11-11 14:07:14 +0000788 r->args_start = NULL;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000789
790 ch = *p++;
791
Igor Sysoev02025fd2005-01-18 13:03:58 +0000792 while (p <= r->uri_end) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000793
794 /*
Igor Sysoev02025fd2005-01-18 13:03:58 +0000795 * we use "ch = *p++" inside the cycle, but this operation is safe,
Igor Sysoev1b735832004-11-11 14:07:14 +0000796 * because after the URI there is always at least one charcter:
797 * the line feed
798 */
Igor Sysoevc2bba092003-11-28 17:41:47 +0000799
Igor Sysoev54498db2004-02-11 17:08:49 +0000800 ngx_log_debug4(NGX_LOG_DEBUG_HTTP, r->connection->log, 0,
Igor Sysoev1b735832004-11-11 14:07:14 +0000801 "s:%d in:'%Xd:%c', out:'%c'", state, ch, ch, *u);
Igor Sysoevc2bba092003-11-28 17:41:47 +0000802
803 switch (state) {
Igor Sysoev09c684b2005-11-09 17:25:55 +0000804
Igor Sysoevc2bba092003-11-28 17:41:47 +0000805 case sw_usual:
806 switch(ch) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000807#if (NGX_WIN32)
808 case '\\':
809 r->uri_ext = NULL;
810
811 if (p == r->uri_start + r->uri.len) {
812
813 /*
814 * we omit the last "\" to cause redirect because
815 * the browsers do not treat "\" as "/" in relative URL path
816 */
817
818 break;
819 }
820
821 state = sw_slash;
822 *u++ = '/';
823 break;
824#endif
Igor Sysoevc2bba092003-11-28 17:41:47 +0000825 case '/':
Igor Sysoev865c1502003-11-30 20:03:18 +0000826 r->uri_ext = NULL;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000827 state = sw_slash;
828 *u++ = ch;
829 break;
830 case '%':
831 quoted_state = state;
832 state = sw_quoted;
833 break;
Igor Sysoev1b735832004-11-11 14:07:14 +0000834 case '?':
835 r->args_start = p;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000836 goto args;
837 case '#':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000838 goto done;
Igor Sysoev865c1502003-11-30 20:03:18 +0000839 case '.':
840 r->uri_ext = u + 1;
Igor Sysoev42b12b32004-12-02 18:40:46 +0000841 *u++ = ch;
842 break;
Igor Sysoevef809b82006-06-28 16:00:26 +0000843 case '+':
844 r->plus_in_uri = 1;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000845 default:
846 *u++ = ch;
847 break;
848 }
849 ch = *p++;
850 break;
851
852 case sw_slash:
853 switch(ch) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000854#if (NGX_WIN32)
855 case '\\':
Igor Sysoev1b735832004-11-11 14:07:14 +0000856#endif
Igor Sysoevc2bba092003-11-28 17:41:47 +0000857 case '/':
858 break;
859 case '.':
860 state = sw_dot;
861 *u++ = ch;
862 break;
863 case '%':
864 quoted_state = state;
865 state = sw_quoted;
866 break;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000867 case '?':
868 r->args_start = p;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000869 goto args;
870 case '#':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000871 goto done;
Igor Sysoevef809b82006-06-28 16:00:26 +0000872 case '+':
873 r->plus_in_uri = 1;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000874 default:
875 state = sw_usual;
876 *u++ = ch;
877 break;
878 }
879 ch = *p++;
880 break;
881
882 case sw_dot:
883 switch(ch) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000884#if (NGX_WIN32)
885 case '\\':
Igor Sysoev1b735832004-11-11 14:07:14 +0000886#endif
Igor Sysoevc2bba092003-11-28 17:41:47 +0000887 case '/':
888 state = sw_slash;
889 u--;
890 break;
891 case '.':
892 state = sw_dot_dot;
893 *u++ = ch;
894 break;
895 case '%':
896 quoted_state = state;
897 state = sw_quoted;
898 break;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000899 case '?':
900 r->args_start = p;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000901 goto args;
902 case '#':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000903 goto done;
Igor Sysoevef809b82006-06-28 16:00:26 +0000904 case '+':
905 r->plus_in_uri = 1;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000906 default:
907 state = sw_usual;
908 *u++ = ch;
909 break;
910 }
911 ch = *p++;
912 break;
913
914 case sw_dot_dot:
915 switch(ch) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000916#if (NGX_WIN32)
917 case '\\':
Igor Sysoev1b735832004-11-11 14:07:14 +0000918#endif
Igor Sysoevc2bba092003-11-28 17:41:47 +0000919 case '/':
920 state = sw_slash;
921 u -= 4;
922 if (u < r->uri.data) {
923 return NGX_HTTP_PARSE_INVALID_REQUEST;
924 }
925 while (*(u - 1) != '/') {
926 u--;
927 }
928 break;
929 case '%':
930 quoted_state = state;
931 state = sw_quoted;
932 break;
Igor Sysoev02025fd2005-01-18 13:03:58 +0000933 case '?':
934 r->args_start = p;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000935 goto args;
936 case '#':
Igor Sysoev02025fd2005-01-18 13:03:58 +0000937 goto done;
Igor Sysoev1b735832004-11-11 14:07:14 +0000938#if (NGX_WIN32)
Igor Sysoevc2bba092003-11-28 17:41:47 +0000939 case '.':
940 state = sw_dot_dot_dot;
941 *u++ = ch;
942 break;
943#endif
Igor Sysoevef809b82006-06-28 16:00:26 +0000944 case '+':
945 r->plus_in_uri = 1;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000946 default:
947 state = sw_usual;
948 *u++ = ch;
949 break;
950 }
951 ch = *p++;
952 break;
953
Igor Sysoev1b735832004-11-11 14:07:14 +0000954#if (NGX_WIN32)
Igor Sysoevc2bba092003-11-28 17:41:47 +0000955 case sw_dot_dot_dot:
956 switch(ch) {
Igor Sysoev1b735832004-11-11 14:07:14 +0000957 case '\\':
Igor Sysoevc2bba092003-11-28 17:41:47 +0000958 case '/':
959 state = sw_slash;
960 u -= 5;
961 if (u < r->uri.data) {
962 return NGX_HTTP_PARSE_INVALID_REQUEST;
963 }
964 while (*u != '/') {
965 u--;
966 }
967 if (u < r->uri.data) {
968 return NGX_HTTP_PARSE_INVALID_REQUEST;
969 }
970 while (*(u - 1) != '/') {
971 u--;
972 }
973 break;
974 case '%':
975 quoted_state = state;
976 state = sw_quoted;
977 break;
Igor Sysoev09c684b2005-11-09 17:25:55 +0000978 case '?':
979 r->args_start = p;
Igor Sysoevb80a7f42006-10-28 10:15:31 +0000980 goto args;
981 case '#':
Igor Sysoev09c684b2005-11-09 17:25:55 +0000982 goto done;
Igor Sysoevef809b82006-06-28 16:00:26 +0000983 case '+':
984 r->plus_in_uri = 1;
Igor Sysoevc2bba092003-11-28 17:41:47 +0000985 default:
986 state = sw_usual;
987 *u++ = ch;
988 break;
989 }
990 ch = *p++;
991 break;
992#endif
993
994 case sw_quoted:
Igor Sysoev8f125582006-07-28 15:16:17 +0000995 r->quoted_uri = 1;
996
Igor Sysoevc2bba092003-11-28 17:41:47 +0000997 if (ch >= '0' && ch <= '9') {
Igor Sysoev9c610952004-03-16 13:35:20 +0000998 decoded = (u_char) (ch - '0');
Igor Sysoevc2bba092003-11-28 17:41:47 +0000999 state = sw_quoted_second;
1000 ch = *p++;
1001 break;
1002 }
1003
Igor Sysoev9c610952004-03-16 13:35:20 +00001004 c = (u_char) (ch | 0x20);
Igor Sysoevc2bba092003-11-28 17:41:47 +00001005 if (c >= 'a' && c <= 'f') {
Igor Sysoev9c610952004-03-16 13:35:20 +00001006 decoded = (u_char) (c - 'a' + 10);
Igor Sysoevc2bba092003-11-28 17:41:47 +00001007 state = sw_quoted_second;
1008 ch = *p++;
1009 break;
1010 }
1011
1012 return NGX_HTTP_PARSE_INVALID_REQUEST;
1013
1014 case sw_quoted_second:
1015 if (ch >= '0' && ch <= '9') {
Igor Sysoev9c610952004-03-16 13:35:20 +00001016 ch = (u_char) ((decoded << 4) + ch - '0');
Igor Sysoev1ebfead2005-02-16 13:40:36 +00001017
Igor Sysoev7adb8c02003-12-02 16:57:05 +00001018 if (ch == '%') {
1019 state = sw_usual;
1020 *u++ = ch;
1021 ch = *p++;
1022 break;
1023 }
Igor Sysoev1ebfead2005-02-16 13:40:36 +00001024
Igor Sysoevb80a7f42006-10-28 10:15:31 +00001025 if (ch == '#') {
1026 *u++ = ch;
1027 ch = *p++;
1028
1029 } else if (ch == '\0') {
Igor Sysoev1ebfead2005-02-16 13:40:36 +00001030 r->zero_in_uri = 1;
Igor Sysoev1ebfead2005-02-16 13:40:36 +00001031 }
1032
Igor Sysoevc2bba092003-11-28 17:41:47 +00001033 state = quoted_state;
1034 break;
1035 }
1036
Igor Sysoev9c610952004-03-16 13:35:20 +00001037 c = (u_char) (ch | 0x20);
Igor Sysoevc2bba092003-11-28 17:41:47 +00001038 if (c >= 'a' && c <= 'f') {
Igor Sysoev9c610952004-03-16 13:35:20 +00001039 ch = (u_char) ((decoded << 4) + c - 'a' + 10);
Igor Sysoevef809b82006-06-28 16:00:26 +00001040
Igor Sysoev02025fd2005-01-18 13:03:58 +00001041 if (ch == '?') {
Igor Sysoev7adb8c02003-12-02 16:57:05 +00001042 *u++ = ch;
1043 ch = *p++;
Igor Sysoevef809b82006-06-28 16:00:26 +00001044
1045 } else if (ch == '+') {
1046 r->plus_in_uri = 1;
Igor Sysoev7adb8c02003-12-02 16:57:05 +00001047 }
Igor Sysoevef809b82006-06-28 16:00:26 +00001048
Igor Sysoevc2bba092003-11-28 17:41:47 +00001049 state = quoted_state;
1050 break;
1051 }
1052
1053 return NGX_HTTP_PARSE_INVALID_REQUEST;
1054 }
1055 }
1056
Igor Sysoev02025fd2005-01-18 13:03:58 +00001057done:
1058
Igor Sysoevc2bba092003-11-28 17:41:47 +00001059 r->uri.len = u - r->uri.data;
Igor Sysoevc2bba092003-11-28 17:41:47 +00001060
Igor Sysoev865c1502003-11-30 20:03:18 +00001061 if (r->uri_ext) {
1062 r->exten.len = u - r->uri_ext;
Igor Sysoev1b735832004-11-11 14:07:14 +00001063 r->exten.data = r->uri_ext;
Igor Sysoev865c1502003-11-30 20:03:18 +00001064 }
1065
1066 r->uri_ext = NULL;
1067
Igor Sysoevc2bba092003-11-28 17:41:47 +00001068 return NGX_OK;
Igor Sysoevb80a7f42006-10-28 10:15:31 +00001069
1070args:
1071
1072 while (p < r->uri_end) {
1073 if (*p++ != '#') {
1074 continue;
1075 }
1076
1077 r->args.len = p - 1 - r->args_start;
1078 r->args.data = r->args_start;
1079 r->args_start = NULL;
1080
1081 break;
1082 }
1083
1084 r->uri.len = u - r->uri.data;
1085
1086 if (r->uri_ext) {
1087 r->exten.len = u - r->uri_ext;
1088 r->exten.data = r->uri_ext;
1089 }
1090
1091 r->uri_ext = NULL;
1092
1093 return NGX_OK;
Igor Sysoevc2bba092003-11-28 17:41:47 +00001094}
Igor Sysoev899b44e2005-05-12 14:58:06 +00001095
1096
1097ngx_int_t
Igor Sysoev09c684b2005-11-09 17:25:55 +00001098ngx_http_parse_unsafe_uri(ngx_http_request_t *r, ngx_str_t *uri,
1099 ngx_str_t *args, ngx_uint_t *flags)
1100{
1101 u_char ch, *p;
1102 size_t len;
1103
1104 len = uri->len;
1105 p = uri->data;
1106
1107 if (len == 0 || p[0] == '?') {
1108 goto unsafe;
1109 }
1110
1111 if (p[0] == '.' && len == 3 && p[1] == '.' && (p[2] == '/'
1112#if (NGX_WIN32)
1113 || p[2] == '\\'
1114#endif
1115 ))
1116 {
1117 goto unsafe;
1118 }
1119
1120 for ( /* void */ ; len; len--) {
1121
1122 ch = *p++;
1123
1124 if (ch == '?') {
1125 args->len = len - 1;
1126 args->data = p;
1127 uri->len -= len;
1128
1129 return NGX_OK;
1130 }
1131
1132 if (ch == '\0') {
1133 *flags |= NGX_HTTP_ZERO_IN_URI;
1134 continue;
1135 }
1136
1137 if (ch != '/'
1138#if (NGX_WIN32)
1139 && ch != '\\'
1140#endif
1141 )
1142 {
1143 continue;
1144 }
1145
1146 if (len > 2) {
1147
1148 /* detect "/../" */
1149
Igor Sysoev3fc6f642005-11-10 07:44:53 +00001150 if (p[0] == '.' && p[1] == '.' && p[2] == '/') {
Igor Sysoev09c684b2005-11-09 17:25:55 +00001151 goto unsafe;
1152 }
1153
1154#if (NGX_WIN32)
1155
1156 if (p[2] == '\\') {
1157 goto unsafe;
1158 }
1159
1160 if (len > 3) {
1161
1162 /* detect "/.../" */
1163
Igor Sysoev3fc6f642005-11-10 07:44:53 +00001164 if (p[0] == '.' && p[1] == '.' && p[2] == '.'
1165 && (p[3] == '/' || p[3] == '\\'))
1166 {
Igor Sysoev09c684b2005-11-09 17:25:55 +00001167 goto unsafe;
1168 }
1169 }
1170#endif
1171 }
1172 }
1173
1174 return NGX_OK;
1175
1176unsafe:
1177
1178 ngx_log_error(NGX_LOG_ERR, r->connection->log, 0,
1179 "unsafe URI \"%V\" was detected", uri);
1180
1181 return NGX_ERROR;
1182}
1183
1184
1185ngx_int_t
Igor Sysoev899b44e2005-05-12 14:58:06 +00001186ngx_http_parse_multi_header_lines(ngx_array_t *headers, ngx_str_t *name,
1187 ngx_str_t *value)
1188{
1189 ngx_uint_t i;
1190 u_char *start, *last, *end, ch;
1191 ngx_table_elt_t **h;
1192
1193 h = headers->elts;
1194
1195 for (i = 0; i < headers->nelts; i++) {
1196
1197 ngx_log_debug2(NGX_LOG_DEBUG_HTTP, headers->pool->log, 0,
1198 "parse header: \"%V: %V\"", &h[i]->key, &h[i]->value);
1199
1200 if (name->len > h[i]->value.len) {
1201 continue;
1202 }
Igor Sysoev0e5dc5c2005-11-15 13:30:52 +00001203
Igor Sysoev899b44e2005-05-12 14:58:06 +00001204 start = h[i]->value.data;
1205 end = h[i]->value.data + h[i]->value.len;
1206
1207 while (start < end) {
1208
1209 if (ngx_strncasecmp(start, name->data, name->len) != 0) {
1210 goto skip;
1211 }
1212
1213 for (start += name->len; start < end && *start == ' '; start++) {
1214 /* void */
1215 }
1216
1217 if (value == NULL) {
1218 if (start == end || *start == ',') {
1219 return i;
1220 }
1221
1222 goto skip;
1223 }
1224
1225 if (start == end || *start++ != '=') {
1226 /* the invalid header value */
1227 goto skip;
1228 }
1229
1230 while (start < end && *start == ' ') { start++; }
1231
1232 for (last = start; last < end && *last != ';'; last++) {
1233 /* void */
1234 }
1235
1236 value->len = last - start;
1237 value->data = start;
1238
1239 return i;
1240
1241 skip:
Igor Sysoev09c684b2005-11-09 17:25:55 +00001242
Igor Sysoev899b44e2005-05-12 14:58:06 +00001243 while (start < end) {
1244 ch = *start++;
1245 if (ch == ';' || ch == ',') {
1246 break;
1247 }
1248 }
1249
1250 while (start < end && *start == ' ') { start++; }
1251 }
1252 }
1253
1254 return NGX_DECLINED;
1255}