public inbox for libc-alpha@sourceware.org
 help / color / mirror / Atom feed
From: Adhemerval Zanella <adhemerval.zanella@linaro.org>
To: libc-alpha@sourceware.org
Subject: Re: [PATCH 4/4] stdlib: Remove lstat usage from realpath [BZ #24970]
Date: Tue, 27 Oct 2020 09:59:46 -0300	[thread overview]
Message-ID: <227ca5fc-0741-ac67-8417-cb4c19c5f217@linaro.org> (raw)
In-Reply-To: <20200910151915.1982465-4-adhemerval.zanella@linaro.org>

Ping.

On 10/09/2020 12:19, Adhemerval Zanella wrote:
> The readlink already tells whether the file is a symlink, so there is
> no need to call lstat to check it.  However for '..' it requires an
> extra readlink check if the previous component can be really accessed,
> otherwise the next iteration will check a possible valid path and end
> early.  It should performance-wise acceptable and a gain over lstat,
> afaik symlink should not update any inode information.
> 
> Checked on x86_64-linux-gnu and i686-linux-gnu.
> ---
>  stdlib/canonicalize.c | 52 ++++++++++++++++++++++---------------------
>  1 file changed, 27 insertions(+), 25 deletions(-)
> 
> diff --git a/stdlib/canonicalize.c b/stdlib/canonicalize.c
> index 44a25a9a59..952f4dca41 100644
> --- a/stdlib/canonicalize.c
> +++ b/stdlib/canonicalize.c
> @@ -55,6 +55,7 @@ __realpath (const char *name, char *resolved)
>    const char *start, *end, *rpath_limit;
>    const size_t path_max = PATH_MAX;
>    int num_links = 0;
> +  char buf[PATH_MAX];
>    char extra_buf[PATH_MAX];
>  
>    if (name == NULL)
> @@ -104,12 +105,6 @@ __realpath (const char *name, char *resolved)
>  
>    for (end = start; *start; start = end)
>      {
> -#ifdef _LIBC
> -      struct stat64 st;
> -#else
> -      struct stat st;
> -#endif
> -
>        /* Skip sequence of multiple path-separators.  */
>        while (*start == '/')
>          ++start;
> @@ -118,12 +113,25 @@ __realpath (const char *name, char *resolved)
>        for (end = start; *end && *end != '/'; ++end)
>          /* Nothing.  */;
>  
> -      if (end - start == 0)
> -        break;
> -      else if (end - start == 1 && start[0] == '.')
> +      if (end - start == 1 && start[0] == '.')
>          /* nothing */;
>        else if (end - start == 2 && start[0] == '.' && start[1] == '.')
>          {
> +          ssize_t n;
> +
> +          if (dest[-1] != '/')
> +            *dest++ = '/';
> +          *dest = '\0';
> +
> +          n = __readlink (rpath, buf, path_max - 1);
> +          if (n == -1)
> +            {
> +              if (errno == ENOTDIR && dest[-1] == '/')
> +                dest[-1] = '\0';
> +              if (errno != EINVAL)
> +                goto error;
> +            }
> +
>            /* Back up to previous component, ignore if at root already.  */
>            if (dest > rpath + 1)
>              for (--dest; dest > rpath && dest[-1] != '/'; --dest)
> @@ -132,6 +140,7 @@ __realpath (const char *name, char *resolved)
>        else
>          {
>            size_t new_size;
> +          ssize_t n;
>  
>            if (dest[-1] != '/')
>              *dest++ = '/';
> @@ -166,25 +175,23 @@ __realpath (const char *name, char *resolved)
>            dest = __mempcpy (dest, start, end - start);
>            *dest = '\0';
>  
> -          if (__lxstat64 (_STAT_VER, rpath, &st) < 0)
> -            goto error;
> -
> -          if (S_ISLNK (st.st_mode))
> +          n = __readlink (rpath, buf, path_max - 1);
> +          if (n < 0)
> +            {
> +              if (errno == ENOTDIR && dest[-1] == '/')
> +                dest[-1] = '\0';
> +              if (errno != EINVAL)
> +                goto error;
> +            }
> +          else
>              {
> -              char buf[PATH_MAX];
>                size_t len;
> -              ssize_t n;
>  
>                if (++num_links > __eloop_threshold ())
>                  {
>                    __set_errno (ELOOP);
>                    goto error;  }
>  
> -              n = __readlink (rpath, buf, path_max - 1);
> -              if (n < 0)
> -                goto error;
> -              buf[n] = '\0';
> -
>                len = strlen (end);
>                /* Check that n + len + 1 doesn't overflow and is <= path_max. */
>                if (n >= SIZE_MAX - len || n + len >= path_max)
> @@ -211,11 +218,6 @@ __realpath (const char *name, char *resolved)
>                        continue;
>                  }
>              }
> -          else if (!S_ISDIR (st.st_mode) && *end != '\0')
> -            {
> -              __set_errno (ENOTDIR);
> -              goto error;
> -            }
>          }
>      }
>    if (dest > rpath + 1 && dest[-1] == '/')
> 

  reply	other threads:[~2020-10-27 12:59 UTC|newest]

Thread overview: 10+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2020-09-10 15:19 [PATCH 1/4] Sync canonicalize with gnulib [BZ #10635] Adhemerval Zanella
2020-09-10 15:19 ` [PATCH v3 2/4 v2] stdlib: Use fixed buffer size for realpath [BZ #26241] Adhemerval Zanella
2020-10-27 12:59   ` Adhemerval Zanella
2020-09-10 15:19 ` [PATCH 3/4] stdlib: Fix arithmetic overflows in realpath [BZ #26592] Adhemerval Zanella
2020-10-27 12:59   ` Adhemerval Zanella
2020-09-10 15:19 ` [PATCH 4/4] stdlib: Remove lstat usage from realpath [BZ #24970] Adhemerval Zanella
2020-10-27 12:59   ` Adhemerval Zanella [this message]
2020-10-27 12:59 ` [PATCH 1/4] Sync canonicalize with gnulib [BZ #10635] Adhemerval Zanella
2020-10-27 13:15 ` Andreas Schwab
2020-10-27 13:22   ` Adhemerval Zanella

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=227ca5fc-0741-ac67-8417-cb4c19c5f217@linaro.org \
    --to=adhemerval.zanella@linaro.org \
    --cc=libc-alpha@sourceware.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).