curl-w32/lib/http1.c

/***************************************************************************
 *                                  _   _ ____  _
 *  Project                     ___| | | |  _ \| |
 *                             / __| | | | |_) | |
 *                            | (__| |_| |  _ <| |___
 *                             \___|\___/|_| \_\_____|
 *
 * Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.
 *
 * This software is licensed as described in the file COPYING, which
 * you should have received as part of this distribution. The terms
 * are also available at https://curl.se/docs/copyright.html.
 *
 * You may opt to use, copy, modify, merge, publish, distribute and/or sell
 * copies of the Software, and permit persons to whom the Software is
 * furnished to do so, under the terms of the COPYING file.
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 * KIND, either express or implied.
 *
 * SPDX-License-Identifier: curl
 *
 ***************************************************************************/

#include "curl_setup.h"

#ifndef CURL_DISABLE_HTTP

#include "urldata.h"
#include <curl/curl.h>
#include "http.h"
#include "http1.h"
#include "urlapi-int.h"

/* The last 3 #include files should be in this order */
#include "curl_printf.h"
#include "curl_memory.h"
#include "memdebug.h"


/* Size of the stack buffer start_req() uses to 0-terminate a request target
 * before handing it to the URL parser. Targets of this length or longer
 * that need URL parsing are rejected. */
#define H1_MAX_URL_LEN   (8*1024)

/*
 * Prepare `parser` for use: wipe the whole struct, remember the maximum
 * accepted line length and set up the scratch buffer with that same limit.
 */
void Curl_h1_req_parse_init(struct h1_req_parser *parser, size_t max_line_len)
{
  /* start from an all-zero state */
  memset(parser, 0, sizeof(struct h1_req_parser));

  /* scratch collects partial lines, bounded by the same limit */
  Curl_dyn_init(&parser->scratch, max_line_len);
  parser->max_line_len = max_line_len;
}

/*
 * Release what the parser holds: the request (if any) and the scratch
 * buffer. Clears the `req` pointer and the `done` flag afterwards.
 * Passing NULL is allowed and does nothing.
 */
void Curl_h1_req_parse_free(struct h1_req_parser *parser)
{
  if(!parser)
    return;

  Curl_http_req_free(parser->req);
  Curl_dyn_free(&parser->scratch);

  /* forget the freed request and allow parsing to start over */
  parser->done = FALSE;
  parser->req = NULL;
}

/*
 * Strip the line terminator from the current line by shortening
 * `parser->line_len`: one trailing LF (if present), then one trailing CR
 * (if present).
 *
 * With H1_PARSE_OPT_STRICT set in `options`, a line without a CR to strip
 * is refused. A trimmed line longer than `parser->max_line_len` is always
 * refused. Both cases return CURLE_URL_MALFORMAT, otherwise CURLE_OK.
 */
static CURLcode trim_line(struct h1_req_parser *parser, int options)
{
  const int strict = (options & H1_PARSE_OPT_STRICT) ? 1 : 0;
  int cr_removed = 0;

  DEBUGASSERT(parser->line);

  /* step 1: drop a single LF at the end */
  if(parser->line_len && (parser->line[parser->line_len - 1] == '\n'))
    parser->line_len--;

  /* step 2: drop a single CR at the (new) end */
  if(parser->line_len && (parser->line[parser->line_len - 1] == '\r')) {
    parser->line_len--;
    cr_removed = 1;
  }

  /* strict parsing insists on the CR */
  if(strict && !cr_removed)
    return CURLE_URL_MALFORMAT;

  return (parser->line_len > parser->max_line_len) ?
    CURLE_URL_MALFORMAT : CURLE_OK;
}

/*
 * Look for the first LF in `buf`. When found, point `parser->line` at
 * `buf`, set `parser->line_len` to the length up to and including the LF,
 * set `*err` to CURLE_OK and return that length.
 *
 * Without an LF in the first `buflen` bytes, the parser is left untouched,
 * `*err` becomes CURLE_AGAIN and -1 is returned.
 */
static ssize_t detect_line(struct h1_req_parser *parser,
                           const char *buf, const size_t buflen,
                           CURLcode *err)
{
  const char *lf;

  DEBUGASSERT(!parser->line);
  lf = memchr(buf, '\n', buflen);
  if(lf) {
    /* the line includes its terminating LF for now */
    parser->line_len = lf - buf + 1;
    parser->line = buf;
    *err = CURLE_OK;
    return (ssize_t)parser->line_len;
  }

  *err = CURLE_AGAIN;
  return -1;
}

/*
 * Try to obtain the next complete, trimmed line from `buf`.
 *
 * A line exposed by the previous call is discarded first (together with
 * the scratch content). If `buf` holds a line end, the bytes up to it
 * complete the line - joined with earlier partial data kept in scratch, if
 * there is any - and the line is trimmed via trim_line(). If `buf` holds no
 * line end, all of it is appended to scratch and `parser->line` stays NULL.
 *
 * Returns the number of bytes consumed from `buf`, or -1 with `*err` set.
 */
static ssize_t next_line(struct h1_req_parser *parser,
                         const char *buf, const size_t buflen, int options,
                         CURLcode *err)
{
  ssize_t consumed;

  /* the line handed out last time is no longer needed */
  if(parser->line) {
    Curl_dyn_reset(&parser->scratch);
    parser->line_len = 0;
    parser->line = NULL;
  }

  consumed = detect_line(parser, buf, buflen, err);
  if(consumed < 0) {
    if(*err != CURLE_AGAIN)
      return consumed;

    /* no line end in `buf`, keep all of it for the next round */
    *err = Curl_dyn_addn(&parser->scratch, (const unsigned char *)buf, buflen);
    return (*err) ? -1 : (ssize_t)buflen;
  }

  if(Curl_dyn_len(&parser->scratch)) {
    /* earlier partial data exists: the full line is scratch + this part */
    *err = Curl_dyn_addn(&parser->scratch, parser->line, parser->line_len);
    if(*err)
      return -1;
    parser->line_len = Curl_dyn_len(&parser->scratch);
    parser->line = Curl_dyn_ptr(&parser->scratch);
  }

  *err = trim_line(parser, options);
  return (*err) ? -1 : consumed;
}

/*
 * Parse the request line in `parser->line` ("METHOD TARGET HTTP_VERSION")
 * and create `parser->req` from it.
 *
 * `scheme_default` (may be NULL) is passed on as the scheme to use when the
 * TARGET itself does not provide one.
 * `options`: with H1_PARSE_OPT_STRICT, a TARGET that is neither '*', a
 * CONNECT authority, starting with '/', nor an absolute URL is refused, and
 * spaces are not allowed when parsing an absolute URL.
 *
 * Returns CURLE_URL_MALFORMAT for a line that does not match,
 * CURLE_OUT_OF_MEMORY when no URL handle could be allocated, otherwise the
 * result of Curl_http_req_make()/Curl_http_req_make2().
 */
static CURLcode start_req(struct h1_req_parser *parser,
                          const char *scheme_default, int options)
{
  const char  *p, *m, *target, *hv, *scheme, *authority, *path;
  size_t m_len, target_len, hv_len, scheme_len, authority_len, path_len;
  size_t i;
  CURLU *url = NULL;
  CURLcode result = CURLE_URL_MALFORMAT; /* Use this as default fail */

  DEBUGASSERT(!parser->req);
  /* line must match: "METHOD TARGET HTTP_VERSION" */
  p = memchr(parser->line, ' ', parser->line_len);
  if(!p || p == parser->line)
    goto out;

  m = parser->line;
  m_len = p - parser->line;
  target = p + 1;
  target_len = hv_len = 0;
  hv = NULL;

  /* URL may contain spaces so scan backwards. Start at the last byte of the
   * trimmed line (a SPACE was found above, so line_len is at least 1) and
   * stop before the SPACE that ends METHOD. */
  for(i = parser->line_len - 1; i > m_len; --i) {
    if(parser->line[i] == ' ') {
      hv = &parser->line[i + 1];
      /* bytes after the SPACE, 0 when the line ends with it */
      hv_len = parser->line_len - i - 1;
      target_len = (hv - target) - 1;
      break;
    }
  }
  /* no SPACE found or empty TARGET or empty HTTP_VERSION */
  if(!target_len || !hv_len)
    goto out;

  /* TODO: we do not check HTTP_VERSION for conformity, should
   + do that when STRICT option is supplied. */
  (void)hv;

  /* The TARGET can be (rfc 9112, ch. 3.2):
   * origin-form:     path + optional query
   * absolute-form:   absolute URI
   * authority-form:  host+port for CONNECT
   * asterisk-form:   '*' for OPTIONS
   *
   * from TARGET, we derive `scheme` `authority` `path`
   * origin-form            --        --          TARGET
   * absolute-form          URL*      URL*        URL*
   * authority-form         --        TARGET      --
   * asterisk-form          --        --          TARGET
   */
  scheme = authority = path = NULL;
  scheme_len = authority_len = path_len = 0;

  if(target_len == 1 && target[0] == '*') {
    /* asterisk-form */
    path = target;
    path_len = target_len;
  }
  else if((m_len == sizeof("CONNECT") - 1) &&
          !strncmp("CONNECT", m, m_len)) {
    /* authority-form. The length must match as well, otherwise any prefix
     * of "CONNECT" (like "CON") would be taken for the CONNECT method. */
    authority = target;
    authority_len = target_len;
  }
  else if(target[0] == '/') {
    /* origin-form */
    path = target;
    path_len = target_len;
  }
  else {
    /* origin-form OR absolute-form */
    CURLUcode uc;
    char tmp[H1_MAX_URL_LEN];

    /* default, unless we see an absolute URL */
    path = target;
    path_len = target_len;

    /* URL parser wants 0-termination */
    if(target_len >= sizeof(tmp))
      goto out;
    memcpy(tmp, target, target_len);
    tmp[target_len] = '\0';
    /* See if treating TARGET as an absolute URL makes sense */
    if(Curl_is_absolute_url(tmp, NULL, 0, FALSE)) {
      int url_options;

      url = curl_url();
      if(!url) {
        result = CURLE_OUT_OF_MEMORY;
        goto out;
      }
      url_options = (CURLU_NON_SUPPORT_SCHEME|
                     CURLU_PATH_AS_IS|
                     CURLU_NO_DEFAULT_PORT);
      if(!(options & H1_PARSE_OPT_STRICT))
        url_options |= CURLU_ALLOW_SPACE;
      uc = curl_url_set(url, CURLUPART_URL, tmp, url_options);
      if(uc) {
        goto out;
      }
    }

    if(!url && (options & H1_PARSE_OPT_STRICT)) {
      /* we should have an absolute URL or have seen `/` earlier */
      goto out;
    }
  }

  if(url) {
    /* absolute-form: the request is built from the parsed URL */
    result = Curl_http_req_make2(&parser->req, m, m_len, url, scheme_default);
  }
  else {
    if(!scheme && scheme_default) {
      scheme = scheme_default;
      scheme_len = strlen(scheme_default);
    }
    result = Curl_http_req_make(&parser->req, m, m_len, scheme, scheme_len,
                                authority, authority_len, path, path_len);
  }

out:
  /* called on every path; `url` is still NULL when no handle was created */
  curl_url_cleanup(url);
  return result;
}

/*
 * Feed `buflen` bytes from `buf` into the request parser.
 *
 * Lines are taken from the input one at a time until the empty line that
 * ends the request head has been seen (`parser->done` becomes TRUE) or the
 * input is used up. The first line creates the request via start_req(),
 * each following non-empty line is added to the request's headers.
 *
 * `scheme_default` and `options` are passed on to the request line parsing,
 * `options` also to the line trimming.
 *
 * Returns the number of bytes consumed from `buf` with `*err` set to
 * CURLE_OK, or -1 with the reason for the failure in `*err`.
 */
ssize_t Curl_h1_req_parse_read(struct h1_req_parser *parser,
                               const char *buf, size_t buflen,
                               const char *scheme_default, int options,
                               CURLcode *err)
{
  ssize_t nread = 0, n;

  *err = CURLE_OK;
  while(!parser->done) {
    n = next_line(parser, buf, buflen, options, err);
    if(n < 0) {
      if(*err == CURLE_AGAIN)
        /* not a failure, report what was consumed so far */
        *err = CURLE_OK;
      else
        /* a real failure: keep the code in `*err` for the caller */
        nread = -1;
      goto out;
    }

    /* Consume this line */
    nread += (size_t)n;
    buf += (size_t)n;
    buflen -= (size_t)n;

    if(!parser->line) {
      /* consumed bytes, but line not complete */
      if(!buflen)
        goto out;
    }
    else if(!parser->req) {
      /* first complete line: this has to be the request line */
      *err = start_req(parser, scheme_default, options);
      if(*err) {
        nread = -1;
        goto out;
      }
    }
    else if(parser->line_len == 0) {
      /* last, empty line, we are finished. `parser->req` is known to be
       * set here, the branch above handles the case where it is not. */
      parser->done = TRUE;
      Curl_dyn_reset(&parser->scratch);
      /* last chance adjustments */
    }
    else {
      /* a header line for the request we already have */
      *err = Curl_dynhds_h1_add_line(&parser->req->headers,
                                     parser->line, parser->line_len);
      if(*err) {
        nread = -1;
        goto out;
      }
    }
  }

out:
  return nread;
}

/*
 * Append the HTTP/1.x head of `req` to `dbuf`: the request line
 * "METHOD [scheme://][authority][path] HTTP/1.<http_minor>", then the
 * request's headers as written by Curl_dynhds_h1_dprint(), then the
 * terminating empty line. Parts of the target that are NULL are left out.
 *
 * Returns the first error encountered, CURLE_OK when everything was added.
 */
CURLcode Curl_h1_req_write_head(struct httpreq *req, int http_minor,
                                struct dynbuf *dbuf)
{
  const char *scheme = req->scheme ? req->scheme : "";
  const char *scheme_sep = req->scheme ? "://" : "";
  const char *authority = req->authority ? req->authority : "";
  const char *path = req->path ? req->path : "";
  CURLcode result;

  /* request line */
  result = Curl_dyn_addf(dbuf, "%s %s%s%s%s HTTP/1.%d\r\n",
                         req->method, scheme, scheme_sep, authority, path,
                         http_minor);
  /* header fields */
  if(!result)
    result = Curl_dynhds_h1_dprint(&req->headers, dbuf);
  /* end of head */
  if(!result)
    result = Curl_dyn_addn(dbuf, STRCONST("\r\n"));

  return result;
}

#endif /* !CURL_DISABLE_HTTP */
Import from curl-8.6.0.zip Upstream: https://github.com/curl/curl/releases/tag/curl-8_6_0 2024-03-02 03:51:05 +00:00			`/***************************************************************************`
			`* _ _ ____ _`
			`* Project ___\| \| \| \| _ \\| \|`
			`* / __\| \| \| \| \|_) \| \|`
			`* \| (__\| \|_\| \| _ <\| \|___`
			`* \___\|\___/\|_\| \_\_____\|`
			`*`
			`* Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.`
			`*`
			`* This software is licensed as described in the file COPYING, which`
			`* you should have received as part of this distribution. The terms`
			`* are also available at https://curl.se/docs/copyright.html.`
			`*`
			`* You may opt to use, copy, modify, merge, publish, distribute and/or sell`
			`* copies of the Software, and permit persons to whom the Software is`
			`* furnished to do so, under the terms of the COPYING file.`
			`*`
			`* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY`
			`* KIND, either express or implied.`
			`*`
			`* SPDX-License-Identifier: curl`
			`*`
			`***************************************************************************/`

			`#include "curl_setup.h"`

			`#ifndef CURL_DISABLE_HTTP`

			`#include "urldata.h"`
			`#include <curl/curl.h>`
			`#include "http.h"`
			`#include "http1.h"`
			`#include "urlapi-int.h"`

			`/* The last 3 #include files should be in this order */`
			`#include "curl_printf.h"`
			`#include "curl_memory.h"`
			`#include "memdebug.h"`


			`#define H1_MAX_URL_LEN (8*1024)`

			`void Curl_h1_req_parse_init(struct h1_req_parser *parser, size_t max_line_len)`
			`{`
			`memset(parser, 0, sizeof(*parser));`
			`parser->max_line_len = max_line_len;`
			`Curl_dyn_init(&parser->scratch, max_line_len);`
			`}`

			`void Curl_h1_req_parse_free(struct h1_req_parser *parser)`
			`{`
			`if(parser) {`
			`Curl_http_req_free(parser->req);`
			`Curl_dyn_free(&parser->scratch);`
			`parser->req = NULL;`
			`parser->done = FALSE;`
			`}`
			`}`

			`static CURLcode trim_line(struct h1_req_parser *parser, int options)`
			`{`
			`DEBUGASSERT(parser->line);`
			`if(parser->line_len) {`
			`if(parser->line[parser->line_len - 1] == '\n')`
			`--parser->line_len;`
			`if(parser->line_len) {`
			`if(parser->line[parser->line_len - 1] == '\r')`
			`--parser->line_len;`
			`else if(options & H1_PARSE_OPT_STRICT)`
			`return CURLE_URL_MALFORMAT;`
			`}`
			`else if(options & H1_PARSE_OPT_STRICT)`
			`return CURLE_URL_MALFORMAT;`
			`}`
			`else if(options & H1_PARSE_OPT_STRICT)`
			`return CURLE_URL_MALFORMAT;`

			`if(parser->line_len > parser->max_line_len) {`
			`return CURLE_URL_MALFORMAT;`
			`}`
			`return CURLE_OK;`
			`}`

			`static ssize_t detect_line(struct h1_req_parser *parser,`
			`const char *buf, const size_t buflen,`
			`CURLcode *err)`
			`{`
			`const char *line_end;`

			`DEBUGASSERT(!parser->line);`
			`line_end = memchr(buf, '\n', buflen);`
			`if(!line_end) {`
			`*err = CURLE_AGAIN;`
			`return -1;`
			`}`
			`parser->line = buf;`
			`parser->line_len = line_end - buf + 1;`
			`*err = CURLE_OK;`
			`return (ssize_t)parser->line_len;`
			`}`

			`static ssize_t next_line(struct h1_req_parser *parser,`
			`const char *buf, const size_t buflen, int options,`
			`CURLcode *err)`
			`{`
			`ssize_t nread = 0;`

			`if(parser->line) {`
			`parser->line = NULL;`
			`parser->line_len = 0;`
			`Curl_dyn_reset(&parser->scratch);`
			`}`

			`nread = detect_line(parser, buf, buflen, err);`
			`if(nread >= 0) {`
			`if(Curl_dyn_len(&parser->scratch)) {`
			`/* append detected line to scratch to have the complete line */`
			`*err = Curl_dyn_addn(&parser->scratch, parser->line, parser->line_len);`
			`if(*err)`
			`return -1;`
			`parser->line = Curl_dyn_ptr(&parser->scratch);`
			`parser->line_len = Curl_dyn_len(&parser->scratch);`
			`}`
			`*err = trim_line(parser, options);`
			`if(*err)`
			`return -1;`
			`}`
			`else if(*err == CURLE_AGAIN) {`
			/* no line end in `buf`, add it to our scratch */
			`*err = Curl_dyn_addn(&parser->scratch, (const unsigned char *)buf, buflen);`
			`nread = (*err)? -1 : (ssize_t)buflen;`
			`}`
			`return nread;`
			`}`

			`static CURLcode start_req(struct h1_req_parser *parser,`
			`const char *scheme_default, int options)`
			`{`
			`const char *p, *m, *target, *hv, *scheme, *authority, *path;`
			`size_t m_len, target_len, hv_len, scheme_len, authority_len, path_len;`
			`size_t i;`
			`CURLU *url = NULL;`
			`CURLcode result = CURLE_URL_MALFORMAT; /* Use this as default fail */`

			`DEBUGASSERT(!parser->req);`
			`/* line must match: "METHOD TARGET HTTP_VERSION" */`
			`p = memchr(parser->line, ' ', parser->line_len);`
			`if(!p \|\| p == parser->line)`
			`goto out;`

			`m = parser->line;`
			`m_len = p - parser->line;`
			`target = p + 1;`
			`target_len = hv_len = 0;`
			`hv = NULL;`

			`/* URL may contain spaces so scan backwards */`
			`for(i = parser->line_len; i > m_len; --i) {`
			`if(parser->line[i] == ' ') {`
			`hv = &parser->line[i + 1];`
			`hv_len = parser->line_len - i;`
			`target_len = (hv - target) - 1;`
			`break;`
			`}`
			`}`
			`/* no SPACE found or empty TARGET or empty HTTP_VERSION */`
			`if(!target_len \|\| !hv_len)`
			`goto out;`

			`/* TODO: we do not check HTTP_VERSION for conformity, should`
			`+ do that when STRICT option is supplied. */`
			`(void)hv;`

			`/* The TARGET can be (rfc 9112, ch. 3.2):`
			`* origin-form: path + optional query`
			`* absolute-form: absolute URI`
			`* authority-form: host+port for CONNECT`
			`* asterisk-form: '*' for OPTIONS`
			`*`
			* from TARGET, we derive `scheme` `authority` `path`
			`* origin-form -- -- TARGET`
			`* absolute-form URL* URL* URL*`
			`* authority-form -- TARGET --`
			`* asterisk-form -- -- TARGET`
			`*/`
			`scheme = authority = path = NULL;`
			`scheme_len = authority_len = path_len = 0;`

			`if(target_len == 1 && target[0] == '*') {`
			`/* asterisk-form */`
			`path = target;`
			`path_len = target_len;`
			`}`
			`else if(!strncmp("CONNECT", m, m_len)) {`
			`/* authority-form */`
			`authority = target;`
			`authority_len = target_len;`
			`}`
			`else if(target[0] == '/') {`
			`/* origin-form */`
			`path = target;`
			`path_len = target_len;`
			`}`
			`else {`
			`/* origin-form OR absolute-form */`
			`CURLUcode uc;`
			`char tmp[H1_MAX_URL_LEN];`

			`/* default, unless we see an absolute URL */`
			`path = target;`
			`path_len = target_len;`

			`/* URL parser wants 0-termination */`
			`if(target_len >= sizeof(tmp))`
			`goto out;`
			`memcpy(tmp, target, target_len);`
			`tmp[target_len] = '\0';`
			`/* See if treating TARGET as an absolute URL makes sense */`
			`if(Curl_is_absolute_url(tmp, NULL, 0, FALSE)) {`
			`int url_options;`

			`url = curl_url();`
			`if(!url) {`
			`result = CURLE_OUT_OF_MEMORY;`
			`goto out;`
			`}`
			`url_options = (CURLU_NON_SUPPORT_SCHEME\|`
			`CURLU_PATH_AS_IS\|`
			`CURLU_NO_DEFAULT_PORT);`
			`if(!(options & H1_PARSE_OPT_STRICT))`
			`url_options \|= CURLU_ALLOW_SPACE;`
			`uc = curl_url_set(url, CURLUPART_URL, tmp, url_options);`
			`if(uc) {`
			`goto out;`
			`}`
			`}`

			`if(!url && (options & H1_PARSE_OPT_STRICT)) {`
			/* we should have an absolute URL or have seen `/` earlier */
			`goto out;`
			`}`
			`}`

			`if(url) {`
			`result = Curl_http_req_make2(&parser->req, m, m_len, url, scheme_default);`
			`}`
			`else {`
			`if(!scheme && scheme_default) {`
			`scheme = scheme_default;`
			`scheme_len = strlen(scheme_default);`
			`}`
			`result = Curl_http_req_make(&parser->req, m, m_len, scheme, scheme_len,`
			`authority, authority_len, path, path_len);`
			`}`

			`out:`
			`curl_url_cleanup(url);`
			`return result;`
			`}`

			`ssize_t Curl_h1_req_parse_read(struct h1_req_parser *parser,`
			`const char *buf, size_t buflen,`
			`const char *scheme_default, int options,`
			`CURLcode *err)`
			`{`
			`ssize_t nread = 0, n;`

			`*err = CURLE_OK;`
			`while(!parser->done) {`
			`n = next_line(parser, buf, buflen, options, err);`
			`if(n < 0) {`
			`if(*err != CURLE_AGAIN) {`
			`nread = -1;`
			`}`
			`*err = CURLE_OK;`
			`goto out;`
			`}`

			`/* Consume this line */`
			`nread += (size_t)n;`
			`buf += (size_t)n;`
			`buflen -= (size_t)n;`

			`if(!parser->line) {`
			`/* consumed bytes, but line not complete */`
			`if(!buflen)`
			`goto out;`
			`}`
			`else if(!parser->req) {`
			`*err = start_req(parser, scheme_default, options);`
			`if(*err) {`
			`nread = -1;`
			`goto out;`
			`}`
			`}`
			`else if(parser->line_len == 0) {`
			`/* last, empty line, we are finished */`
			`if(!parser->req) {`
			`*err = CURLE_URL_MALFORMAT;`
			`nread = -1;`
			`goto out;`
			`}`
			`parser->done = TRUE;`
			`Curl_dyn_reset(&parser->scratch);`
			`/* last chance adjustments */`
			`}`
			`else {`
			`*err = Curl_dynhds_h1_add_line(&parser->req->headers,`
			`parser->line, parser->line_len);`
			`if(*err) {`
			`nread = -1;`
			`goto out;`
			`}`
			`}`
			`}`

			`out:`
			`return nread;`
			`}`

			`CURLcode Curl_h1_req_write_head(struct httpreq *req, int http_minor,`
			`struct dynbuf *dbuf)`
			`{`
			`CURLcode result;`

			`result = Curl_dyn_addf(dbuf, "%s %s%s%s%s HTTP/1.%d\r\n",`
			`req->method,`
			`req->scheme? req->scheme : "",`
			`req->scheme? "://" : "",`
			`req->authority? req->authority : "",`
			`req->path? req->path : "",`
			`http_minor);`
			`if(result)`
			`goto out;`

			`result = Curl_dynhds_h1_dprint(&req->headers, dbuf);`
			`if(result)`
			`goto out;`

			`result = Curl_dyn_addn(dbuf, STRCONST("\r\n"));`

			`out:`
			`return result;`
			`}`

			`#endif /* !CURL_DISABLE_HTTP */`