Files
findutils/lib/regextype.c
Bernhard Voelker c9c2c51175 regexprops: sort regex_map alphabetically
Commit '1b53838ddf' has changed the order of the nodes, yet not
quite well.  Let's use alphabetical sort order.

* lib/regextype.c (regex_map): Move 'awk' and 'egrep' entries up.
2025-07-09 20:49:51 +02:00

158 lines
4.4 KiB
C

/* regextype.c -- Decode the name of a regular expression syntax into an
option name.
Copyright (C) 2005-2025 Free Software Foundation, Inc.
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <https://www.gnu.org/licenses/>.
*/
/* Written by James Youngman, <jay@gnu.org>. */
/* config.h must be included first. */
#include <config.h>
/* system headers. */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/* gnulib headers. */
#include "quote.h"
#include "regex.h"
#include "regextype.h"
#include "xalloc.h"
/* findutils headers */
#include "system.h"
/* One row of the table that maps a regular expression type name to the
   syntax flags it stands for.  The rows of regex_map are initialised
   positionally, so the member order here must not change.  */
struct tagRegexTypeMap
{
/* The name that is compared (with strcmp) against the string given to
   get_regex_type, e.g. "posix-extended".  */
const char *name;
/* A CONTEXT_* value; get_regex_type_synonym tests it as a bit mask
   against the context supplied by its caller.  */
int context;
/* The RE_SYNTAX_* flags that get_regex_type returns for NAME.  */
int option_val;
};
/* The regular expression types that can be selected by name.  Each row
   holds the name, the CONTEXT_* value recorded for it, and the
   RE_SYNTAX_* flags it selects.

   "findutils-default" comes first; the remaining rows are kept in
   alphabetical order.  Row order is significant: get_regex_type_synonym
   only ever reports a synonym that appears EARLIER in this table, so
   moving a row can change which of two equivalent names is treated as
   the primary one.

   Nothing writes to the table after initialisation, hence `const'.  */
static const struct tagRegexTypeMap regex_map[] =
  {
    { "findutils-default",   CONTEXT_FINDUTILS, RE_SYNTAX_EMACS|RE_DOT_NEWLINE },
    { "awk",                 CONTEXT_ALL,       RE_SYNTAX_AWK },
    { "ed",                  CONTEXT_GENERIC,   RE_SYNTAX_ED },
    { "egrep",               CONTEXT_ALL,       RE_SYNTAX_EGREP },
    { "emacs",               CONTEXT_ALL,       RE_SYNTAX_EMACS },
    { "gnu-awk",             CONTEXT_ALL,       RE_SYNTAX_GNU_AWK },
    { "grep",                CONTEXT_ALL,       RE_SYNTAX_GREP },
    { "posix-awk",           CONTEXT_ALL,       RE_SYNTAX_POSIX_AWK },
    { "posix-basic",         CONTEXT_ALL,       RE_SYNTAX_POSIX_BASIC },
    { "posix-egrep",         CONTEXT_ALL,       RE_SYNTAX_POSIX_EGREP },
    { "posix-extended",      CONTEXT_ALL,       RE_SYNTAX_POSIX_EXTENDED },
    { "posix-minimal-basic", CONTEXT_GENERIC,   RE_SYNTAX_POSIX_MINIMAL_BASIC },
    { "sed",                 CONTEXT_GENERIC,   RE_SYNTAX_SED },
    /* Disabled entry, kept for reference only:
       { "posix-common", CONTEXT_GENERIC, _RE_SYNTAX_POSIX_COMMON }  */
  };
/* Number of rows in regex_map, worked out by the compiler so that it
   follows the table automatically when rows are added or removed.  */
enum { N_REGEX_MAP_ENTRIES = sizeof regex_map / sizeof *regex_map };
/* Translate the regular expression type name S into the matching
   RE_SYNTAX_* flags.

   S is compared exactly (strcmp) with each name in regex_map and the
   option value of the first matching row is returned.

   If no row matches, a diagnostic that lists every known name is issued
   through error () with status EXIT_FAILURE; control is not expected to
   come back from that call, and the trailing `return -1' exists only so
   that every path through the function returns a value.  */
int
get_regex_type (const char *s)
{
  unsigned i;
  size_t msglen;
  char *buf, *p;

  /* Do the lookup on its own first, so that the successful path does
     no quoting or length bookkeeping at all.  */
  for (i = 0u; i < N_REGEX_MAP_ENTRIES; ++i)
    {
      if (0 == strcmp (regex_map[i].name, s))
        return regex_map[i].option_val;
    }

  /* We didn't find a match for the type of regular expression that the
   * user indicated they wanted.  Tell them what the options are.
   */

  /* First pass: work out exactly how long the comma-separated list of
     quoted names is (a ", " separator goes before every name except
     the first).  */
  msglen = 0u;
  for (i = 0u; i < N_REGEX_MAP_ENTRIES; ++i)
    {
      if (i > 0u)
        msglen += 2u;
      msglen += strlen (quote (regex_map[i].name));
    }

  /* Second pass: assemble the list.  Every copy uses a length that was
     measured just beforehand, so nothing can run past the MSGLEN bytes
     (plus terminator) allocated here.  */
  p = buf = xmalloc (1u + msglen);
  for (i = 0u; i < N_REGEX_MAP_ENTRIES; ++i)
    {
      const char *quoted;
      size_t len;

      if (i > 0u)
        {
          memcpy (p, ", ", 2u);
          p += 2;
        }

      /* Copy the quoted name straight away: the result of quote () is
         assumed to be valid only until the next call to quote ().  */
      quoted = quote (regex_map[i].name);
      len = strlen (quoted);
      memcpy (p, quoted, len);
      p += len;
    }
  *p = '\0';

  error (EXIT_FAILURE, 0,
         _("Unknown regular expression type %s; valid types are %s."),
         quote (s),
         buf);
  /*NOTREACHED*/
  return -1;
}
/* Return the name held in row IX of regex_map, or NULL when IX lies
   beyond the last row.  Callers can therefore enumerate the names by
   counting up from zero until NULL comes back.  */
const char *
get_regex_type_name (unsigned int ix)
{
  return (ix < N_REGEX_MAP_ENTRIES) ? regex_map[ix].name : NULL;
}
/* Return the option value (RE_SYNTAX_* flags) held in row IX of
   regex_map, or -1 when IX lies beyond the last row.  */
int
get_regex_type_flags (unsigned int ix)
{
  if (ix >= N_REGEX_MAP_ENTRIES)
    return -1;

  return regex_map[ix].option_val;
}
/* Return the context value held in row IX of regex_map, or 0 when IX
   lies beyond the last row.  */
unsigned int get_regex_type_context (unsigned int ix)
{
  if (ix >= N_REGEX_MAP_ENTRIES)
    return 0u;

  return regex_map[ix].context;
}
/* Find an earlier row of regex_map that selects exactly the same flags
   as row IX and whose context shares at least one bit with CONTEXT.

   Returns the index of the first such row, or -1 if there is none or
   if IX lies beyond the last row.  */
int
get_regex_type_synonym (unsigned int ix, unsigned int context)
{
  unsigned candidate;
  int wanted;

  if (ix >= N_REGEX_MAP_ENTRIES)
    return -1;

  wanted = regex_map[ix].option_val;

  /* Only rows that come before IX are examined.  That way the same row
     of an equivalent pair is always picked as the primary name, and we
     never report x and y as synonyms of each other.  */
  for (candidate = 0u; candidate < ix; ++candidate)
    {
      /* A row outside the requested context is skipped: there is no
         point in saying "x is a synonym of y" when y itself is not
         going to be included.  */
      if ((regex_map[candidate].context & context) != 0
          && regex_map[candidate].option_val == wanted)
        return candidate;
    }

  return -1;
}