123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322 |
- /***************************************************************************
- * _ _ ____ _
- * Project ___| | | | _ \| |
- * / __| | | | |_) | |
- * | (__| |_| | _ <| |___
- * \___|\___/|_| \_\_____|
- *
- * Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.
- *
- * This software is licensed as described in the file COPYING, which
- * you should have received as part of this distribution. The terms
- * are also available at https://curl.se/docs/copyright.html.
- *
- * You may opt to use, copy, modify, merge, publish, distribute and/or sell
- * copies of the Software, and permit persons to whom the Software is
- * furnished to do so, under the terms of the COPYING file.
- *
- * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
- * KIND, either express or implied.
- *
- * SPDX-License-Identifier: curl
- *
- ***************************************************************************/
- #include "curl_setup.h"
- #ifndef CURL_DISABLE_HTTP
- #include "urldata.h"
- #include <curl/curl.h>
- #include "http.h"
- #include "http1.h"
- #include "urlapi-int.h"
- /* The last 3 #include files should be in this order */
- #include "curl_printf.h"
- #include "curl_memory.h"
- #include "memdebug.h"
- #define H1_MAX_URL_LEN (8*1024)
- void Curl_h1_req_parse_init(struct h1_req_parser *parser, size_t max_line_len)
- {
- memset(parser, 0, sizeof(*parser));
- parser->max_line_len = max_line_len;
- Curl_dyn_init(&parser->scratch, max_line_len);
- }
- void Curl_h1_req_parse_free(struct h1_req_parser *parser)
- {
- if(parser) {
- Curl_http_req_free(parser->req);
- Curl_dyn_free(&parser->scratch);
- parser->req = NULL;
- parser->done = FALSE;
- }
- }
- static CURLcode trim_line(struct h1_req_parser *parser, int options)
- {
- DEBUGASSERT(parser->line);
- if(parser->line_len) {
- if(parser->line[parser->line_len - 1] == '\n')
- --parser->line_len;
- if(parser->line_len) {
- if(parser->line[parser->line_len - 1] == '\r')
- --parser->line_len;
- else if(options & H1_PARSE_OPT_STRICT)
- return CURLE_URL_MALFORMAT;
- }
- else if(options & H1_PARSE_OPT_STRICT)
- return CURLE_URL_MALFORMAT;
- }
- else if(options & H1_PARSE_OPT_STRICT)
- return CURLE_URL_MALFORMAT;
- if(parser->line_len > parser->max_line_len) {
- return CURLE_URL_MALFORMAT;
- }
- return CURLE_OK;
- }
- static ssize_t detect_line(struct h1_req_parser *parser,
- const char *buf, const size_t buflen,
- CURLcode *err)
- {
- const char *line_end;
- DEBUGASSERT(!parser->line);
- line_end = memchr(buf, '\n', buflen);
- if(!line_end) {
- *err = CURLE_AGAIN;
- return -1;
- }
- parser->line = buf;
- parser->line_len = line_end - buf + 1;
- *err = CURLE_OK;
- return (ssize_t)parser->line_len;
- }
- static ssize_t next_line(struct h1_req_parser *parser,
- const char *buf, const size_t buflen, int options,
- CURLcode *err)
- {
- ssize_t nread = 0;
- if(parser->line) {
- parser->line = NULL;
- parser->line_len = 0;
- Curl_dyn_reset(&parser->scratch);
- }
- nread = detect_line(parser, buf, buflen, err);
- if(nread >= 0) {
- if(Curl_dyn_len(&parser->scratch)) {
- /* append detected line to scratch to have the complete line */
- *err = Curl_dyn_addn(&parser->scratch, parser->line, parser->line_len);
- if(*err)
- return -1;
- parser->line = Curl_dyn_ptr(&parser->scratch);
- parser->line_len = Curl_dyn_len(&parser->scratch);
- }
- *err = trim_line(parser, options);
- if(*err)
- return -1;
- }
- else if(*err == CURLE_AGAIN) {
- /* no line end in `buf`, add it to our scratch */
- *err = Curl_dyn_addn(&parser->scratch, (const unsigned char *)buf, buflen);
- nread = (*err)? -1 : (ssize_t)buflen;
- }
- return nread;
- }
- static CURLcode start_req(struct h1_req_parser *parser,
- const char *scheme_default, int options)
- {
- const char *p, *m, *target, *hv, *scheme, *authority, *path;
- size_t m_len, target_len, hv_len, scheme_len, authority_len, path_len;
- size_t i;
- CURLU *url = NULL;
- CURLcode result = CURLE_URL_MALFORMAT; /* Use this as default fail */
- DEBUGASSERT(!parser->req);
- /* line must match: "METHOD TARGET HTTP_VERSION" */
- p = memchr(parser->line, ' ', parser->line_len);
- if(!p || p == parser->line)
- goto out;
- m = parser->line;
- m_len = p - parser->line;
- target = p + 1;
- target_len = hv_len = 0;
- hv = NULL;
- /* URL may contain spaces so scan backwards */
- for(i = parser->line_len; i > m_len; --i) {
- if(parser->line[i] == ' ') {
- hv = &parser->line[i + 1];
- hv_len = parser->line_len - i;
- target_len = (hv - target) - 1;
- break;
- }
- }
- /* no SPACE found or empty TARGET or empy HTTP_VERSION */
- if(!target_len || !hv_len)
- goto out;
- /* TODO: we do not check HTTP_VERSION for conformity, should
- + do that when STRICT option is supplied. */
- (void)hv;
- /* The TARGET can be (rfc 9112, ch. 3.2):
- * origin-form: path + optional query
- * absolute-form: absolute URI
- * authority-form: host+port for CONNECT
- * asterisk-form: '*' for OPTIONS
- *
- * from TARGET, we derive `scheme` `authority` `path`
- * origin-form -- -- TARGET
- * absolute-form URL* URL* URL*
- * authority-form -- TARGET --
- * asterisk-form -- -- TARGET
- */
- scheme = authority = path = NULL;
- scheme_len = authority_len = path_len = 0;
- if(target_len == 1 && target[0] == '*') {
- /* asterisk-form */
- path = target;
- path_len = target_len;
- }
- else if(!strncmp("CONNECT", m, m_len)) {
- /* authority-form */
- authority = target;
- authority_len = target_len;
- }
- else if(target[0] == '/') {
- /* origin-form */
- path = target;
- path_len = target_len;
- }
- else {
- /* origin-form OR absolute-form */
- CURLUcode uc;
- char tmp[H1_MAX_URL_LEN];
- /* default, unless we see an absolute URL */
- path = target;
- path_len = target_len;
- /* URL parser wants 0-termination */
- if(target_len >= sizeof(tmp))
- goto out;
- memcpy(tmp, target, target_len);
- tmp[target_len] = '\0';
- /* See if treating TARGET as an absolute URL makes sense */
- if(Curl_is_absolute_url(tmp, NULL, 0, FALSE)) {
- int url_options;
- url = curl_url();
- if(!url) {
- result = CURLE_OUT_OF_MEMORY;
- goto out;
- }
- url_options = (CURLU_NON_SUPPORT_SCHEME|
- CURLU_PATH_AS_IS|
- CURLU_NO_DEFAULT_PORT);
- if(!(options & H1_PARSE_OPT_STRICT))
- url_options |= CURLU_ALLOW_SPACE;
- uc = curl_url_set(url, CURLUPART_URL, tmp, url_options);
- if(uc) {
- goto out;
- }
- }
- if(!url && (options & H1_PARSE_OPT_STRICT)) {
- /* we should have an absolute URL or have seen `/` earlier */
- goto out;
- }
- }
- if(url) {
- result = Curl_http_req_make2(&parser->req, m, m_len, url, scheme_default);
- }
- else {
- if(!scheme && scheme_default) {
- scheme = scheme_default;
- scheme_len = strlen(scheme_default);
- }
- result = Curl_http_req_make(&parser->req, m, m_len, scheme, scheme_len,
- authority, authority_len, path, path_len);
- }
- out:
- curl_url_cleanup(url);
- return result;
- }
- ssize_t Curl_h1_req_parse_read(struct h1_req_parser *parser,
- const char *buf, size_t buflen,
- const char *scheme_default, int options,
- CURLcode *err)
- {
- ssize_t nread = 0, n;
- *err = CURLE_OK;
- while(!parser->done) {
- n = next_line(parser, buf, buflen, options, err);
- if(n < 0) {
- if(*err != CURLE_AGAIN) {
- nread = -1;
- }
- *err = CURLE_OK;
- goto out;
- }
- /* Consume this line */
- nread += (size_t)n;
- buf += (size_t)n;
- buflen -= (size_t)n;
- if(!parser->line) {
- /* consumed bytes, but line not complete */
- if(!buflen)
- goto out;
- }
- else if(!parser->req) {
- *err = start_req(parser, scheme_default, options);
- if(*err) {
- nread = -1;
- goto out;
- }
- }
- else if(parser->line_len == 0) {
- /* last, empty line, we are finished */
- if(!parser->req) {
- *err = CURLE_URL_MALFORMAT;
- nread = -1;
- goto out;
- }
- parser->done = TRUE;
- Curl_dyn_reset(&parser->scratch);
- /* last chance adjustments */
- }
- else {
- *err = Curl_dynhds_h1_add_line(&parser->req->headers,
- parser->line, parser->line_len);
- if(*err) {
- nread = -1;
- goto out;
- }
- }
- }
- out:
- return nread;
- }
- #endif /* !CURL_DISABLE_HTTP */
|