url: use the URL API internally as well

... to make it a truly unified URL parser. Closes #3017
2024-08-13 17:03:50 -04:00 · 2018-09-14 23:33:28 +02:00 · 2018-09-14 23:33:28 +02:00 · 46e164069d
commit 46e164069d
parent f078361c0e
22 changed files with 386 additions and 928 deletions
--- a/lib/curl_path.c
+++ b/lib/curl_path.c
@ -5,7 +5,7 @@
 *                            | (__| |_| |  _ <| |___
 *                             \___|\___/|_| \_\_____|
 *
- * Copyright (C) 1998 - 2017, Daniel Stenberg, <daniel@haxx.se>, et al.
+ * Copyright (C) 1998 - 2018, Daniel Stenberg, <daniel@haxx.se>, et al.
 *
 * This software is licensed as described in the file COPYING, which
 * you should have received as part of this distribution. The terms
@ -39,7 +39,7 @@ CURLcode Curl_getworkingpath(struct connectdata *conn,
  char *working_path;
  size_t working_path_len;
  CURLcode result =
-    Curl_urldecode(data, data->state.path, 0, &working_path,
+    Curl_urldecode(data, data->state.up.path, 0, &working_path,
                   &working_path_len, FALSE);
  if(result)
    return result;
--- a/lib/dict.c
+++ b/lib/dict.c
@ -136,7 +136,7 @@ static CURLcode dict_do(struct connectdata *conn, bool *done)
  struct Curl_easy *data = conn->data;
  curl_socket_t sockfd = conn->sock[FIRSTSOCKET];
-  char *path = data->state.path;
+  char *path = data->state.up.path;
  curl_off_t *bytecount = &data->req.bytecount;
  *done = TRUE; /* unconditionally */
--- a/lib/easy.c
+++ b/lib/easy.c
@ -1002,10 +1002,6 @@ struct Curl_easy *curl_easy_duphandle(struct Curl_easy *data)
 */
 void curl_easy_reset(struct Curl_easy *data)
 {
  Curl_safefree(data->state.pathbuffer);
  data->state.path = NULL;
  Curl_free_request_state(data);
  /* zero out UserDefined data: */
--- a/lib/file.c
+++ b/lib/file.c
@ -143,7 +143,7 @@ static CURLcode file_connect(struct connectdata *conn, bool *done)
 #endif
  size_t real_path_len;
-  CURLcode result = Curl_urldecode(data, data->state.path, 0, &real_path,
+  CURLcode result = Curl_urldecode(data, data->state.up.path, 0, &real_path,
                                   &real_path_len, FALSE);
  if(result)
    return result;
@ -197,7 +197,7 @@ static CURLcode file_connect(struct connectdata *conn, bool *done)
  file->fd = fd;
  if(!data->set.upload && (fd == -1)) {
-    failf(data, "Couldn't open file %s", data->state.path);
+    failf(data, "Couldn't open file %s", data->state.up.path);
    file_done(conn, CURLE_FILE_COULDNT_READ_FILE, FALSE);
    return CURLE_FILE_COULDNT_READ_FILE;
  }
--- a/lib/ftp.c
+++ b/lib/ftp.c
@ -1444,6 +1444,7 @@ static CURLcode ftp_state_list(struct connectdata *conn)
 {
  CURLcode result = CURLE_OK;
  struct Curl_easy *data = conn->data;
  struct FTP *ftp = data->req.protop;
  /* If this output is to be machine-parsed, the NLST command might be better
     to use, since the LIST command output is not specified or standard in any
@ -1460,7 +1461,7 @@ static CURLcode ftp_state_list(struct connectdata *conn)
     then just do LIST (in that case: nothing to do here)
  */
  char *cmd, *lstArg, *slashPos;
-  const char *inpath = data->state.path;
+  const char *inpath = ftp->path;
  lstArg = NULL;
  if((data->set.ftp_filemethod == FTPFILE_NOCWD) &&
@ -3141,7 +3142,7 @@ static CURLcode ftp_done(struct connectdata *conn, CURLcode status,
  int ftpcode;
  CURLcode result = CURLE_OK;
  char *path = NULL;
-  const char *path_to_use = data->state.path;
+  const char *path_to_use = ftp->path;
  if(!ftp)
    return CURLE_OK;
@ -3346,7 +3347,7 @@ static CURLcode ftp_done(struct connectdata *conn, CURLcode status,
  /* Send any post-transfer QUOTE strings? */
  if(!status && !result && !premature && data->set.postquote)
    result = ftp_sendquote(conn, data->set.postquote);
-
+  Curl_safefree(ftp->pathalloc);
  return result;
 }
@ -3695,12 +3696,13 @@ static void wc_data_dtor(void *ptr)
 static CURLcode init_wc_data(struct connectdata *conn)
 {
  char *last_slash;
-  char *path = conn->data->state.path;
+  struct FTP *ftp = conn->data->req.protop;
  char *path = ftp->path;
  struct WildcardData *wildcard = &(conn->data->wildcard);
  CURLcode result = CURLE_OK;
  struct ftp_wc *ftpwc = NULL;
-  last_slash = strrchr(conn->data->state.path, '/');
+  last_slash = strrchr(ftp->path, '/');
  if(last_slash) {
    last_slash++;
    if(last_slash[0] == '\0') {
@ -3757,7 +3759,7 @@ static CURLcode init_wc_data(struct connectdata *conn)
    goto fail;
  }
-  wildcard->path = strdup(conn->data->state.path);
+  wildcard->path = strdup(ftp->path);
  if(!wildcard->path) {
    result = CURLE_OUT_OF_MEMORY;
    goto fail;
@ -3828,16 +3830,15 @@ static CURLcode wc_statemach(struct connectdata *conn)
    /* filelist has at least one file, lets get first one */
    struct ftp_conn *ftpc = &conn->proto.ftpc;
    struct curl_fileinfo *finfo = wildcard->filelist.head->ptr;
    struct FTP *ftp = conn->data->req.protop;
    char *tmp_path = aprintf("%s%s", wildcard->path, finfo->filename);
    if(!tmp_path)
      return CURLE_OUT_OF_MEMORY;
-    /* switch default "state.pathbuffer" and tmp_path, good to see
+    /* switch default ftp->path and tmp_path */
-       ftp_parse_url_path function to understand this trick */
+    free(ftp->pathalloc);
-    Curl_safefree(conn->data->state.pathbuffer);
+    ftp->pathalloc = ftp->path = tmp_path;
    conn->data->state.pathbuffer = tmp_path;
    conn->data->state.path = tmp_path;
    infof(conn->data, "Wildcard - START of \"%s\"\n", finfo->filename);
    if(conn->data->set.chunk_bgn) {
@ -4105,7 +4106,7 @@ CURLcode ftp_parse_url_path(struct connectdata *conn)
  struct FTP *ftp = data->req.protop;
  struct ftp_conn *ftpc = &conn->proto.ftpc;
  const char *slash_pos;  /* position of the first '/' char in curpos */
-  const char *path_to_use = data->state.path;
+  const char *path_to_use = ftp->path;
  const char *cur_pos;
  const char *filename = NULL;
@ -4191,7 +4192,7 @@ CURLcode ftp_parse_url_path(struct connectdata *conn)
      /* parse the URL path into separate path components */
      while((slash_pos = strchr(cur_pos, '/')) != NULL) {
        /* 1 or 0 pointer offset to indicate absolute directory */
-        ssize_t absolute_dir = ((cur_pos - data->state.path > 0) &&
+        ssize_t absolute_dir = ((cur_pos - ftp->path > 0) &&
                                (ftpc->dirdepth == 0))?1:0;
        /* seek out the next path component */
@ -4268,7 +4269,7 @@ CURLcode ftp_parse_url_path(struct connectdata *conn)
    size_t dlen;
    char *path;
    CURLcode result =
-      Curl_urldecode(conn->data, data->state.path, 0, &path, &dlen, TRUE);
+      Curl_urldecode(conn->data, ftp->path, 0, &path, &dlen, TRUE);
    if(result) {
      freedirs(ftpc);
      return result;
@ -4388,16 +4389,16 @@ static CURLcode ftp_setup_connection(struct connectdata *conn)
  char *type;
  struct FTP *ftp;
-  conn->data->req.protop = ftp = malloc(sizeof(struct FTP));
+  conn->data->req.protop = ftp = calloc(sizeof(struct FTP), 1);
  if(NULL == ftp)
    return CURLE_OUT_OF_MEMORY;
-  data->state.path++;   /* don't include the initial slash */
+  ftp->path = &data->state.up.path[1]; /* don't include the initial slash */
  data->state.slash_removed = TRUE; /* we've skipped the slash */
  /* FTP URLs support an extension like ";type=<typecode>" that
   * we'll try to get now! */
-  type = strstr(data->state.path, ";type=");
+  type = strstr(ftp->path, ";type=");
  if(!type)
    type = strstr(conn->host.rawalloc, ";type=");
--- a/lib/ftp.h
+++ b/lib/ftp.h
@ -105,6 +105,8 @@ struct FTP {
  curl_off_t *bytecountp;
  char *user;    /* user name string */
  char *passwd;  /* password string */
  char *path;    /* points to the urlpieces struct field */
  char *pathalloc; /* if non-NULL a pointer to an allocated path */
  /* transfer a file/body or not, done as a typedefed enum just to make
     debuggers display the full symbol and not just the numerical value */
--- a/lib/gopher.c
+++ b/lib/gopher.c
@ -78,7 +78,7 @@ static CURLcode gopher_do(struct connectdata *conn, bool *done)
  curl_socket_t sockfd = conn->sock[FIRSTSOCKET];
  curl_off_t *bytecount = &data->req.bytecount;
-  char *path = data->state.path;
+  char *path = data->state.up.path;
  char *sel = NULL;
  char *sel_org = NULL;
  ssize_t amount, k;
--- a/lib/http.c
+++ b/lib/http.c
@ -1877,7 +1877,8 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
  struct Curl_easy *data = conn->data;
  CURLcode result = CURLE_OK;
  struct HTTP *http;
-  const char *ppath = data->state.path;
+  const char *path = data->state.up.path;
  const char *query = data->state.up.query;
  bool paste_ftp_userpwd = FALSE;
  char ftp_typecode[sizeof("/;type=?")] = "";
  const char *host = conn->host.name;
@ -1995,7 +1996,7 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
  }
  /* setup the authentication headers */
-  result = Curl_http_output_auth(conn, request, ppath, FALSE);
+  result = Curl_http_output_auth(conn, request, path, FALSE);
  if(result)
    return result;
@ -2223,47 +2224,59 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
    /* The path sent to the proxy is in fact the entire URL. But if the remote
       host is a IDN-name, we must make sure that the request we produce only
       uses the encoded host name! */
    /* and no fragment part */
    CURLUcode uc;
    char *url;
    CURLU *h = curl_url_dup(data->state.uh);
    if(!h)
      return CURLE_OUT_OF_MEMORY;
    if(conn->host.dispname != conn->host.name) {
-      char *url = data->change.url;
+      uc = curl_url_set(h, CURLUPART_HOST, conn->host.name, 0);
-      ptr = strstr(url, conn->host.dispname);
+      if(uc) {
-      if(ptr) {
+        curl_url_cleanup(h);
-        /* This is where the display name starts in the URL, now replace this
+        return CURLE_OUT_OF_MEMORY;
           part with the encoded name. TODO: This method of replacing the host
           name is rather crude as I believe there's a slight risk that the
           user has entered a user name or password that contain the host name
           string. */
        size_t currlen = strlen(conn->host.dispname);
        size_t newlen = strlen(conn->host.name);
        size_t urllen = strlen(url);
        char *newurl;
        newurl = malloc(urllen + newlen - currlen + 1);
        if(newurl) {
          /* copy the part before the host name */
          memcpy(newurl, url, ptr - url);
          /* append the new host name instead of the old */
          memcpy(newurl + (ptr - url), conn->host.name, newlen);
          /* append the piece after the host name */
          memcpy(newurl + newlen + (ptr - url),
                 ptr + currlen, /* copy the trailing zero byte too */
                 urllen - (ptr-url) - currlen + 1);
          if(data->change.url_alloc) {
            Curl_safefree(data->change.url);
            data->change.url_alloc = FALSE;
          }
          data->change.url = newurl;
          data->change.url_alloc = TRUE;
        }
        else
          return CURLE_OUT_OF_MEMORY;
      }
    }
-    ppath = data->change.url;
+    uc = curl_url_set(h, CURLUPART_FRAGMENT, NULL, 0);
-    if(checkprefix("ftp://", ppath)) {
+    if(uc) {
      curl_url_cleanup(h);
      return CURLE_OUT_OF_MEMORY;
    }
    if(strcasecompare("http", data->state.up.scheme)) {
      /* when getting HTTP, we don't want the userinfo the URL */
      uc = curl_url_set(h, CURLUPART_USER, NULL, 0);
      if(uc) {
        curl_url_cleanup(h);
        return CURLE_OUT_OF_MEMORY;
      }
      uc = curl_url_set(h, CURLUPART_PASSWORD, NULL, 0);
      if(uc) {
        curl_url_cleanup(h);
        return CURLE_OUT_OF_MEMORY;
      }
    }
    /* now extract the new version of the URL */
    uc = curl_url_get(h, CURLUPART_URL, &url, 0);
    if(uc) {
      curl_url_cleanup(h);
      return CURLE_OUT_OF_MEMORY;
    }
    if(data->change.url_alloc)
      free(data->change.url);
    data->change.url = url;
    data->change.url_alloc = TRUE;
    curl_url_cleanup(h);
    if(strcasecompare("ftp", data->state.up.scheme)) {
      if(data->set.proxy_transfer_mode) {
        /* when doing ftp, append ;type=<a|i> if not present */
-        char *type = strstr(ppath, ";type=");
+        char *type = strstr(path, ";type=");
        if(type && type[6] && type[7] == 0) {
          switch(Curl_raw_toupper(type[6])) {
          case 'A':
@ -2278,7 +2291,7 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
          char *p = ftp_typecode;
          /* avoid sending invalid URLs like ftp://example.com;type=i if the
           * user specified ftp://example.com without the slash */
-          if(!*data->state.path && ppath[strlen(ppath) - 1] != '/') {
+          if(!*data->state.up.path && path[strlen(path) - 1] != '/') {
            *p++ = '/';
          }
          snprintf(p, sizeof(ftp_typecode) - 1, ";type=%c",
@ -2431,18 +2444,32 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
  if(result)
    return result;
-  if(data->set.str[STRING_TARGET])
+  if(data->set.str[STRING_TARGET]) {
-    ppath = data->set.str[STRING_TARGET];
+    path = data->set.str[STRING_TARGET];
    query = NULL;
  }
  /* url */
-  if(paste_ftp_userpwd)
+  if(conn->bits.httpproxy && !conn->bits.tunnel_proxy) {
    char *url = data->change.url;
    result = Curl_add_buffer(&req_buffer, url, strlen(url));
    if(result)
      return result;
  }
  else if(paste_ftp_userpwd)
    result = Curl_add_bufferf(&req_buffer, "ftp://%s:%s@%s",
                              conn->user, conn->passwd,
-                              ppath + sizeof("ftp://") - 1);
+                              path + sizeof("ftp://") - 1);
-  else
+  else {
-    result = Curl_add_buffer(&req_buffer, ppath, strlen(ppath));
+    result = Curl_add_buffer(&req_buffer, path, strlen(path));
-  if(result)
+    if(result)
-    return result;
+      return result;
    if(query) {
      result = Curl_add_bufferf(&req_buffer, "?%s", query);
      if(result)
        return result;
    }
  }
  result =
    Curl_add_bufferf(&req_buffer,
@ -2515,7 +2542,7 @@ CURLcode Curl_http(struct connectdata *conn, bool *done)
      co = Curl_cookie_getlist(data->cookies,
                               conn->allocptr.cookiehost?
                               conn->allocptr.cookiehost:host,
-                               data->state.path,
+                               data->state.up.path,
                               (conn->handler->protocol&CURLPROTO_HTTPS)?
                               TRUE:FALSE);
      Curl_share_unlock(data, CURL_LOCK_DATA_COOKIE);
@ -3836,7 +3863,7 @@ CURLcode Curl_http_readwrite_headers(struct Curl_easy *data,
                         here, or else use real peer host name. */
                      conn->allocptr.cookiehost?
                      conn->allocptr.cookiehost:conn->host.name,
-                      data->state.path);
+                      data->state.up.path);
      Curl_share_unlock(data, CURL_LOCK_DATA_COOKIE);
    }
 #endif
--- a/lib/imap.c
+++ b/lib/imap.c
@ -1717,8 +1717,6 @@ static CURLcode imap_regular_transfer(struct connectdata *conn,
 static CURLcode imap_setup_connection(struct connectdata *conn)
 {
  struct Curl_easy *data = conn->data;
  /* Initialise the IMAP layer */
  CURLcode result = imap_init(conn);
  if(result)
@ -1726,7 +1724,6 @@ static CURLcode imap_setup_connection(struct connectdata *conn)
  /* Clear the TLS upgraded flag */
  conn->tls_upgraded = FALSE;
  data->state.path++;   /* don't include the initial slash */
  return CURLE_OK;
 }
@ -1959,7 +1956,7 @@ static CURLcode imap_parse_url_path(struct connectdata *conn)
  CURLcode result = CURLE_OK;
  struct Curl_easy *data = conn->data;
  struct IMAP *imap = data->req.protop;
-  const char *begin = data->state.path;
+  const char *begin = &data->state.up.path[1]; /* skip leading slash */
  const char *ptr = begin;
  /* See how much of the URL is a valid path and decode it */
@ -2065,17 +2062,10 @@ static CURLcode imap_parse_url_path(struct connectdata *conn)
  /* Does the URL contain a query parameter? Only valid when we have a mailbox
     and no UID as per RFC-5092 */
-  if(imap->mailbox && !imap->uid && !imap->mindex && *ptr == '?') {
+  if(imap->mailbox && !imap->uid && !imap->mindex) {
-    /* Find the length of the query parameter */
+    /* Get the query parameter, URL decoded */
-    begin = ++ptr;
+    (void)curl_url_get(data->state.uh, CURLUPART_QUERY, &imap->query,
-    while(imap_is_bchar(*ptr))
+                       CURLU_URLDECODE);
      ptr++;
    /* Decode the query parameter */
    result = Curl_urldecode(data, begin, ptr - begin, &imap->query, NULL,
                            TRUE);
    if(result)
      return result;
  }
  /* Any extra stuff at the end of the URL is an error */
--- a/lib/ldap.c
+++ b/lib/ldap.c
@ -5,7 +5,7 @@
 *                | (__| |_| |  _ <| |___
 *                 \___|\___/|_| \_\_____|
 *
- * Copyright (C) 1998 - 2017, Daniel Stenberg, <daniel@haxx.se>, et al.
+ * Copyright (C) 1998 - 2018, Daniel Stenberg, <daniel@haxx.se>, et al.
 *
 * This software is licensed as described in the file COPYING, which
 * you should have received as part of this distribution. The terms
@ -838,9 +838,9 @@ static int _ldap_url_parse2(const struct connectdata *conn, LDAPURLDesc *ludp)
  size_t i;
  if(!conn->data ||
-     !conn->data->state.path ||
+     !conn->data->state.up.path ||
-     conn->data->state.path[0] != '/' ||
+     conn->data->state.up.path[0] != '/' ||
-     !checkprefix("LDAP", conn->data->change.url))
+     !strcasecompare("LDAP", conn->data->state.up.scheme))
    return LDAP_INVALID_SYNTAX;
  ludp->lud_scope = LDAP_SCOPE_BASE;
@ -848,7 +848,7 @@ static int _ldap_url_parse2(const struct connectdata *conn, LDAPURLDesc *ludp)
  ludp->lud_host  = conn->host.name;
  /* Duplicate the path */
-  p = path = strdup(conn->data->state.path + 1);
+  p = path = strdup(conn->data->state.up.path + 1);
  if(!path)
    return LDAP_NO_MEMORY;
--- a/lib/multi.c
+++ b/lib/multi.c
@ -542,10 +542,8 @@ static CURLcode multi_done(struct connectdata **connp,
  Curl_getoff_all_pipelines(data, conn);
  /* Cleanup possible redirect junk */
-  free(data->req.newurl);
+  Curl_safefree(data->req.newurl);
-  data->req.newurl = NULL;
+  Curl_safefree(data->req.location);
  free(data->req.location);
  data->req.location = NULL;
  switch(status) {
  case CURLE_ABORTED_BY_CALLBACK:
@ -657,7 +655,6 @@ static CURLcode multi_done(struct connectdata **connp,
                    cache here, and therefore cannot be used from this point on
                 */
  Curl_free_request_state(data);
  return result;
 }
@ -2015,8 +2012,6 @@ static CURLMcode multi_runsingle(struct Curl_multi *multi,
      }
      else if(comeback)
        rc = CURLM_CALL_MULTI_PERFORM;
      free(newurl);
      break;
    }
--- a/lib/pop3.c
+++ b/lib/pop3.c
@ -1303,8 +1303,6 @@ static CURLcode pop3_regular_transfer(struct connectdata *conn,
 static CURLcode pop3_setup_connection(struct connectdata *conn)
 {
  struct Curl_easy *data = conn->data;
  /* Initialise the POP3 layer */
  CURLcode result = pop3_init(conn);
  if(result)
@ -1312,7 +1310,6 @@ static CURLcode pop3_setup_connection(struct connectdata *conn)
  /* Clear the TLS upgraded flag */
  conn->tls_upgraded = FALSE;
  data->state.path++;   /* don't include the initial slash */
  return CURLE_OK;
 }
@ -1387,7 +1384,7 @@ static CURLcode pop3_parse_url_path(struct connectdata *conn)
  /* The POP3 struct is already initialised in pop3_connect() */
  struct Curl_easy *data = conn->data;
  struct POP3 *pop3 = data->req.protop;
-  const char *path = data->state.path;
+  const char *path = &data->state.up.path[1]; /* skip leading path */
  /* URL decode the path for the message ID */
  return Curl_urldecode(data, path, 0, &pop3->id, NULL, TRUE);
--- a/lib/smb.c
+++ b/lib/smb.c
@ -969,7 +969,7 @@ static CURLcode smb_parse_url_path(struct connectdata *conn)
  char *slash;
  /* URL decode the path */
-  result = Curl_urldecode(data, data->state.path, 0, &path, NULL, TRUE);
+  result = Curl_urldecode(data, data->state.up.path, 0, &path, NULL, TRUE);
  if(result)
    return result;
--- a/lib/smtp.c
+++ b/lib/smtp.c
@ -1441,7 +1441,6 @@ static CURLcode smtp_regular_transfer(struct connectdata *conn,
 static CURLcode smtp_setup_connection(struct connectdata *conn)
 {
  struct Curl_easy *data = conn->data;
  CURLcode result;
  /* Clear the TLS upgraded flag */
@ -1452,8 +1451,6 @@ static CURLcode smtp_setup_connection(struct connectdata *conn)
  if(result)
    return result;
  data->state.path++;   /* don't include the initial slash */
  return CURLE_OK;
 }
@ -1507,7 +1504,7 @@ static CURLcode smtp_parse_url_path(struct connectdata *conn)
  /* The SMTP struct is already initialised in smtp_connect() */
  struct Curl_easy *data = conn->data;
  struct smtp_conn *smtpc = &conn->proto.smtpc;
-  const char *path = data->state.path;
+  const char *path = &data->state.up.path[1]; /* skip leading path */
  char localhost[HOSTNAME_MAX + 1];
  /* Calculate the path if necessary */
--- a/lib/tftp.c
+++ b/lib/tftp.c
@ -485,7 +485,7 @@ static CURLcode tftp_send_first(tftp_state_data_t *state, tftp_event_t event)
    /* As RFC3617 describes the separator slash is not actually part of the
       file name so we skip the always-present first letter of the path
       string. */
-    result = Curl_urldecode(data, &state->conn->data->state.path[1], 0,
+    result = Curl_urldecode(data, &state->conn->data->state.up.path[1], 0,
                            &filename, NULL, FALSE);
    if(result)
      return result;
@ -1374,7 +1374,7 @@ static CURLcode tftp_setup_connection(struct connectdata * conn)
  /* TFTP URLs support an extension like ";mode=<typecode>" that
   * we'll try to get now! */
-  type = strstr(data->state.path, ";mode=");
+  type = strstr(data->state.up.path, ";mode=");
  if(!type)
    type = strstr(conn->host.rawalloc, ";mode=");
--- a/lib/transfer.c
+++ b/lib/transfer.c
@ -567,7 +567,7 @@ static CURLcode readwrite_data(struct Curl_easy *data,
            infof(data,
                  "Rewinding stream by : %zd"
                  " bytes on url %s (zero-length body)\n",
-                  nread, data->state.path);
+                  nread, data->state.up.path);
            read_rewind(conn, (size_t)nread);
          }
          else {
@ -575,7 +575,7 @@ static CURLcode readwrite_data(struct Curl_easy *data,
                  "Excess found in a non pipelined read:"
                  " excess = %zd"
                  " url = %s (zero-length body)\n",
-                  nread, data->state.path);
+                  nread, data->state.up.path);
          }
        }
@ -744,7 +744,7 @@ static CURLcode readwrite_data(struct Curl_easy *data,
                  " bytes on url %s (size = %" CURL_FORMAT_CURL_OFF_T
                  ", maxdownload = %" CURL_FORMAT_CURL_OFF_T
                  ", bytecount = %" CURL_FORMAT_CURL_OFF_T ", nread = %zd)\n",
-                  excess, data->state.path,
+                  excess, data->state.up.path,
                  k->size, k->maxdownload, k->bytecount, nread);
            read_rewind(conn, excess);
          }
@ -1474,6 +1474,7 @@ CURLcode Curl_follow(struct Curl_easy *data,
  /* Location: redirect */
  bool disallowport = FALSE;
  bool reachedmax = FALSE;
  CURLUcode uc;
  if(type == FOLLOW_REDIR) {
    if((data->set.maxredirs != -1) &&
@ -1506,33 +1507,21 @@ CURLcode Curl_follow(struct Curl_easy *data,
    }
  }
-  if(!Curl_is_absolute_url(newurl, NULL, 8)) {
+  if(Curl_is_absolute_url(newurl, NULL, MAX_SCHEME_LEN))
    /***
     *DANG* this is an RFC 2068 violation. The URL is supposed
     to be absolute and this doesn't seem to be that!
     */
    char *absolute = Curl_concat_url(data->change.url, newurl);
    if(!absolute)
      return CURLE_OUT_OF_MEMORY;
    newurl = absolute;
  }
  else {
    /* The new URL MAY contain space or high byte values, that means a mighty
       stupid redirect URL but we still make an effort to do "right". */
    char *newest;
    size_t newlen = Curl_strlen_url(newurl, FALSE);
    /* This is an absolute URL, don't allow the custom port number */
    disallowport = TRUE;
-    newest = malloc(newlen + 1); /* get memory for this */
+  DEBUGASSERT(data->state.uh);
-    if(!newest)
+  uc = curl_url_set(data->state.uh, CURLUPART_URL, newurl, 0);
-      return CURLE_OUT_OF_MEMORY;
+  free(newurl);
  if(uc)
    /* TODO: consider an error code remap here */
    return CURLE_URL_MALFORMAT;
-    Curl_strcpy_url(newest, newurl, FALSE); /* create a space-free URL */
+  uc = curl_url_get(data->state.uh, CURLUPART_URL, &newurl, 0);
-    newurl = newest; /* use this instead now */
+  if(uc)
-
+    /* TODO: consider an error code remap here */
-  }
+    return CURLE_OUT_OF_MEMORY;
  if(type == FOLLOW_FAKE) {
    /* we're only figuring out the new url if we would've followed locations
@ -1549,10 +1538,8 @@ CURLcode Curl_follow(struct Curl_easy *data,
  if(disallowport)
    data->state.allow_port = FALSE;
-  if(data->change.url_alloc) {
+  if(data->change.url_alloc)
    Curl_safefree(data->change.url);
    data->change.url_alloc = FALSE;
  }
  data->change.url = newurl;
  data->change.url_alloc = TRUE;
--- a/lib/url.c
+++ b/lib/url.c
--- a/lib/url.h
+++ b/lib/url.h
@ -48,6 +48,8 @@ CURLcode Curl_open(struct Curl_easy **curl);
 CURLcode Curl_init_userdefined(struct Curl_easy *data);
 void Curl_freeset(struct Curl_easy * data);
 /* free the URL pieces */
 void Curl_up_free(struct Curl_easy *data);
 CURLcode Curl_close(struct Curl_easy *data); /* opposite of curl_open() */
 CURLcode Curl_connect(struct Curl_easy *, struct connectdata **,
                      bool *async, bool *protocol_connect);
--- a/lib/urldata.h
+++ b/lib/urldata.h
@ -1224,6 +1224,18 @@ struct time_node {
  expire_id eid;
 };
 /* individual pieces of the URL */
 struct urlpieces {
  char *scheme;
  char *hostname;
  char *port;
  char *user;
  char *password;
  char *options;
  char *path;
  char *query;
 };
 struct UrlState {
  /* Points to the connection cache */
@ -1314,9 +1326,6 @@ struct UrlState {
  /* for FTP downloads: how many CRLFs did we converted to LFs? */
  curl_off_t crlf_conversions;
 #endif
  char *pathbuffer;/* allocated buffer to store the URL's path part in */
  char *path;      /* path to use, points to somewhere within the pathbuffer
                      area */
  bool slash_removed; /* set TRUE if the 'path' points to a path where the
                         initial URL slash separator has been taken off */
  bool use_range;
@ -1350,6 +1359,8 @@ struct UrlState {
 #ifdef CURLDEBUG
  bool conncache_lock;
 #endif
  CURLU *uh; /* URL handle for the current parsed URL */
  struct urlpieces up;
 };
--- a/tests/data/test325
+++ b/tests/data/test325
@ -15,7 +15,7 @@ HTTP/1.1 301 OK
 Date: Thu, 09 Nov 2010 14:49:00 GMT
 Server: test-server/fake
 Content-Length: 7
-Location: http://%HOSTIP:%HTTPPORT/325
+Location: http://somewhere/325
 MooMoo
 </data>
@ -24,7 +24,7 @@ HTTP/1.1 301 OK
 Date: Thu, 09 Nov 2010 14:49:00 GMT
 Server: test-server/fake
 Content-Length: 7
-Location: http://%HOSTIP:%HTTPPORT/325
+Location: http://somewhere/325
 </datacheck>
 </reply>
--- a/tests/data/test523
+++ b/tests/data/test523
@ -39,7 +39,7 @@ HTTP GET with proxy and CURLOPT_PORT
 </name>
 # first URL then proxy
 <command>
-http://www.example.com:999/523 http://%HOSTIP:%HTTPPORT 
+http://www.example.com:999/523 http://%HOSTIP:%HTTPPORT
 </command>
 </client>
@ -50,7 +50,7 @@ http://www.example.com:999/523 http://%HOSTIP:%HTTPPORT
 ^User-Agent:.*
 </strip>
 <protocol>
-GET HTTP://www.example.com:19999/523 HTTP/1.1
+GET http://www.example.com:19999/523 HTTP/1.1
 Host: www.example.com:19999
 Authorization: Basic eHh4Onl5eQ==
 Accept: */*
--- a/tests/data/test563
+++ b/tests/data/test563
@ -47,7 +47,7 @@ ftp_proxy=http://%HOSTIP:%HTTPPORT/
 # Verify data after the test has been "shot"
 <verify>
 <protocol>
-GET FTP://%HOSTIP:%FTPPORT/563;type=A HTTP/1.1
+GET ftp://%HOSTIP:%FTPPORT/563;type=A HTTP/1.1
 Host: %HOSTIP:%FTPPORT
 Accept: */*
 Proxy-Connection: Keep-Alive