From: Adhemerval Zanella Netto <adhemerval.zanella@linaro.org>
To: Wilco Dijkstra <Wilco.Dijkstra@arm.com>,
'GNU C Library' <libc-alpha@sourceware.org>
Subject: Re: [PATCH] Benchtests: Remove simple_strcspn/strpbrk/strsep
Date: Wed, 8 Mar 2023 12:24:01 -0300 [thread overview]
Message-ID: <5ff76fc9-e40e-4a1e-71e2-a683a31f9b62@linaro.org> (raw)
In-Reply-To: <PAWPR08MB8982522B5EE5567FD55710B583B49@PAWPR08MB8982.eurprd08.prod.outlook.com>
On 08/03/23 08:05, Wilco Dijkstra via Libc-alpha wrote:
>
> Remove simple_strcspn/strpbrk/strsep which are significantly slower than the generic
> implementations. Also remove oldstrsep and oldstrtok since they are practically identical
> to the generic implementation. Adjust iteration count to reduce benchmark time.
LGTM, thanks.
Reviewed-by: Adhemerval Zanella <adhemerval.zanella@linaro.org>
>
> ---
>
> diff --git a/benchtests/bench-strcspn.c b/benchtests/bench-strcspn.c
> index 2388f33d5441b302ffe34a9bb4ee7ed70db7306b..fa74d305ae66c8f220b2f35d8733520a62a84968 100644
> --- a/benchtests/bench-strcspn.c
> +++ b/benchtests/bench-strcspn.c
> @@ -26,29 +26,8 @@
> #endif /* WIDE */
> #include "bench-string.h"
>
> -#ifndef WIDE
> -# define SIMPLE_STRCSPN simple_strcspn
> -#else
> -# define SIMPLE_STRCSPN simple_wcscspn
> -#endif /* WIDE */
> -
> typedef size_t (*proto_t) (const CHAR *, const CHAR *);
> -size_t SIMPLE_STRCSPN (const CHAR *, const CHAR *);
>
> -IMPL (SIMPLE_STRCSPN, 0)
> IMPL (STRCSPN, 1)
>
> -size_t
> -SIMPLE_STRCSPN (const CHAR *s, const CHAR *rej)
> -{
> - const CHAR *r, *str = s;
> - CHAR c;
> -
> - while ((c = *s++) != '\0')
> - for (r = rej; *r != '\0'; ++r)
> - if (*r == c)
> - return s - str - 1;
> - return s - str - 1;
> -}
> -
> #include "bench-strpbrk.c"
> diff --git a/benchtests/bench-strpbrk.c b/benchtests/bench-strpbrk.c
> index e96fb0efbf06fcb6c329917f73a90149d2bcb944..55199b73c9233bcedf52bd8e45dca628371c2803 100644
> --- a/benchtests/bench-strpbrk.c
> +++ b/benchtests/bench-strpbrk.c
> @@ -35,31 +35,10 @@
> # endif /* WIDE */
> # include "bench-string.h"
>
> -# ifndef WIDE
> -# define SIMPLE_STRPBRK simple_strpbrk
> -# else
> -# define SIMPLE_STRPBRK simple_wcspbrk
> -# endif /* WIDE */
> -
> typedef CHAR *(*proto_t) (const CHAR *, const CHAR *);
> -CHAR *SIMPLE_STRPBRK (const CHAR *, const CHAR *);
>
> -IMPL (SIMPLE_STRPBRK, 0)
> IMPL (STRPBRK, 1)
>
> -CHAR *
> -SIMPLE_STRPBRK (const CHAR *s, const CHAR *rej)
> -{
> - const CHAR *r;
> - CHAR c;
> -
> - while ((c = *s++) != '\0')
> - for (r = rej; *r != '\0'; ++r)
> - if (*r == c)
> - return (CHAR *) s - 1;
> - return NULL;
> -}
> -
> #endif /* !STRPBRK_RESULT */
>
> #include "json-lib.h"
> @@ -69,7 +48,7 @@ do_one_test (json_ctx_t *json_ctx, impl_t *impl, const CHAR *s,
> const CHAR *rej, RES_TYPE exp_res)
> {
> RES_TYPE res = CALL (impl, s, rej);
> - size_t i, iters = INNER_LOOP_ITERS;
> + size_t i, iters = INNER_LOOP_ITERS8 / CHARBYTES;
> timing_t start, stop, cur;
>
> if (res != exp_res)
> diff --git a/benchtests/bench-strsep.c b/benchtests/bench-strsep.c
> index 4b203aff30db1592120db5f0b39b06a6e9cd4a13..d7df3fa0a9aae04918ad54fc7927a1da18ceb402 100644
> --- a/benchtests/bench-strsep.c
> +++ b/benchtests/bench-strsep.c
> @@ -20,90 +20,14 @@
> #define TEST_NAME "strsep"
> #include "bench-string.h"
>
> -char *
> -simple_strsep (char **s1, char *s2)
> -{
> - char *begin;
> - char *s;
> - size_t j = 0;
> -
> - begin = *s1;
> - s = begin;
> - if (begin == NULL)
> - return NULL;
> - ssize_t s2len = strlen (s2);
> - while (*s)
> - {
> - for (j = 0; j < s2len; j++)
> - {
> - if (*s == s2[j])
> - {
> - s[0] = '\0';
> - *s1 = s + 1;
> - return begin;
> - }
> - }
> - s++;
> - }
> - *s1 = NULL;
> - return begin;
> -}
> -
> -char *
> -oldstrsep (char **stringp, const char *delim)
> -{
> - char *begin, *end;
> -
> - begin = *stringp;
> - if (begin == NULL)
> - return NULL;
> -
> - /* A frequent case is when the delimiter string contains only one
> - character. Here we don't need to call the expensive `strpbrk'
> - function and instead work using `strchr'. */
> - if (delim[0] == '\0' || delim[1] == '\0')
> - {
> - char ch = delim[0];
> -
> - if (ch == '\0')
> - end = NULL;
> - else
> - {
> - if (*begin == ch)
> - end = begin;
> - else if (*begin == '\0')
> - end = NULL;
> - else
> - end = strchr (begin + 1, ch);
> - }
> - }
> - else
> - /* Find the end of the token. */
> - end = strpbrk (begin, delim);
> -
> - if (end)
> - {
> - /* Terminate the token and set *STRINGP past NUL character. */
> - *end++ = '\0';
> - *stringp = end;
> - }
> - else
> - /* No more delimiters; this is the last token. */
> - *stringp = NULL;
> -
> - return begin;
> -}
> -
> typedef char *(*proto_t) (const char **, const char *);
>
> -IMPL (simple_strsep, 0)
> IMPL (strsep, 1)
> -IMPL (oldstrsep, 2)
>
> static void
> do_one_test (impl_t * impl, const char *s1, const char *s2)
> {
> - size_t i, iters = INNER_LOOP_ITERS_SMALL;
> + size_t i, iters = INNER_LOOP_ITERS;
> timing_t start, stop, cur;
>
> TIMING_NOW (start);
> diff --git a/benchtests/bench-strspn.c b/benchtests/bench-strspn.c
> index 707613cbcf5ac556e6d5a0c3a95c19be1dcadfc6..cc98ffb38bd5d7085efa8c1d1fb7aba6c46c1b3f 100644
> --- a/benchtests/bench-strspn.c
> +++ b/benchtests/bench-strspn.c
> @@ -28,41 +28,20 @@
> #define BIG_CHAR MAX_CHAR
>
> #ifndef WIDE
> -# define SIMPLE_STRSPN simple_strspn
> # define SMALL_CHAR 127
> #else
> -# define SIMPLE_STRSPN simple_wcsspn
> # define SMALL_CHAR 1273
> #endif /* WIDE */
>
> typedef size_t (*proto_t) (const CHAR *, const CHAR *);
> -size_t SIMPLE_STRSPN (const CHAR *, const CHAR *);
>
> -IMPL (SIMPLE_STRSPN, 0)
> IMPL (STRSPN, 1)
>
> -size_t
> -SIMPLE_STRSPN (const CHAR *s, const CHAR *acc)
> -{
> - const CHAR *r, *str = s;
> - CHAR c;
> -
> - while ((c = *s++) != '\0')
> - {
> - for (r = acc; *r != '\0'; ++r)
> - if (*r == c)
> - break;
> - if (*r == '\0')
> - return s - str - 1;
> - }
> - return s - str - 1;
> -}
> -
> static void
> do_one_test (json_ctx_t *json_ctx, impl_t *impl, const CHAR *s,
> const CHAR *acc, size_t exp_res)
> {
> - size_t res = CALL (impl, s, acc), i, iters = INNER_LOOP_ITERS;
> + size_t res = CALL (impl, s, acc), i, iters = INNER_LOOP_ITERS8 / CHARBYTES;
> timing_t start, stop, cur;
>
> if (res != exp_res)
> diff --git a/benchtests/bench-strtok.c b/benchtests/bench-strtok.c
> index 711bdaab58ff297855b03d62057cefd066f4e1c5..b5789d7bf243c40810f38efd40f0bb9c870327ca 100644
> --- a/benchtests/bench-strtok.c
> +++ b/benchtests/bench-strtok.c
> @@ -20,47 +20,14 @@
> #define TEST_NAME "strtok"
> #include "bench-string.h"
>
> -char *
> -oldstrtok (char *s, const char *delim)
> -{
> - static char *olds;
> - char *token;
> -
> - if (s == NULL)
> - s = olds;
> -
> - /* Scan leading delimiters. */
> - s += strspn (s, delim);
> - if (*s == '\0')
> - {
> - olds = s;
> - return NULL;
> - }
> -
> - /* Find the end of the token. */
> - token = s;
> - s = strpbrk (token, delim);
> - if (s == NULL)
> - /* This token finishes the string. */
> - olds = strchr (token, '\0');
> - else
> - {
> - /* Terminate the token and make OLDS point past it. */
> - *s = '\0';
> - olds = s + 1;
> - }
> - return token;
> -}
> -
> typedef char *(*proto_t) (const char *, const char *);
>
> -IMPL (oldstrtok, 0)
> IMPL (strtok, 1)
>
> static void
> do_one_test (impl_t * impl, const char *s1, const char *s2)
> {
> - size_t i, iters = INNER_LOOP_ITERS_SMALL;
> + size_t i, iters = INNER_LOOP_ITERS_MEDIUM;
> timing_t start, stop, cur;
> TIMING_NOW (start);
> for (i = 0; i < iters; ++i)
> @@ -74,7 +41,6 @@ do_one_test (impl_t * impl, const char *s1, const char *s2)
> TIMING_DIFF (cur, start, stop);
>
> TIMING_PRINT_MEAN ((double) cur, (double) iters);
> -
> }
>
>
>
prev parent reply other threads:[~2023-03-08 15:24 UTC|newest]
Thread overview: 2+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-03-08 11:05 Wilco Dijkstra
2023-03-08 15:24 ` Adhemerval Zanella Netto [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=5ff76fc9-e40e-4a1e-71e2-a683a31f9b62@linaro.org \
--to=adhemerval.zanella@linaro.org \
--cc=Wilco.Dijkstra@arm.com \
--cc=libc-alpha@sourceware.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).