dcd8284393
(to be imported soon).
445 lines
18 KiB
C
445 lines
18 KiB
C
/* Handles parsing the Options provided by the user.
|
|
Copyright (C) 1989 Free Software Foundation, Inc.
|
|
written by Douglas C. Schmidt (schmidt@ics.uci.edu)
|
|
|
|
This file is part of GNU GPERF.
|
|
|
|
GNU GPERF is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 1, or (at your option)
|
|
any later version.
|
|
|
|
GNU GPERF is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GNU GPERF; see the file COPYING. If not, write to
|
|
the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
|
|
|
|
#include <stdio.h>
|
|
#include <assert.h>
|
|
#include "options.h"
|
|
#include "iterator.h"
|
|
#include "stderr.h"
|
|
|
|
/* Current program version. */
|
|
extern char *version_string;
|
|
|
|
/* Size to jump on a collision. */
|
|
#define DEFAULT_JUMP_VALUE 5
|
|
|
|
/* Default name for generated lookup function. */
|
|
#define DEFAULT_NAME "in_word_set"
|
|
|
|
/* Default name for the key component. */
|
|
#define DEFAULT_KEY "name"
|
|
|
|
/* Default name for generated hash function. */
|
|
#define DEFAULT_HASH_NAME "hash"
|
|
|
|
/* Globally visible OPTIONS object. */
|
|
OPTIONS option;
|
|
|
|
/* Default delimiters that separate keywords from their attributes. */
|
|
#define DEFAULT_DELIMITERS ",\n"
|
|
|
|
/* Reports the one-line command synopsis through report_error, followed
   by a hint that `-h' gives the full help.  The `%n' directives are
   interpreted by report_error (presumably as the program name -- see
   stderr.c).  */

void
usage ()
{
  static char synopsis[] = "usage: %n [-acCdDef[num]gGhH<hashname>i<init>jk<keys>\
K<keyname>lnN<name>oprs<size>S<switches>tTv].\n(type %n -h for help)\n";

  report_error (synopsis);
}
|
|
|
|
/* Arranges the LEN key positions stored in BASE into *descending* order,
   in place, using insertion sort (cheap when the input is already nearly
   ordered).  Descending order is what the code generators expect.

   Returns 1 when every position is distinct.  Returns 0 as soon as two
   equal positions meet; BASE is then left partially rearranged.  */

static int
key_sort (base, len)
     char *base;
     int len;
{
  int next_unsorted;

  /* base[0 .. next_unsorted-1] is always sorted in descending order.  */
  for (next_unsorted = 1; next_unsorted < len; next_unsorted++)
    {
      int pending = base[next_unsorted];
      int slot = next_unsorted;

      /* Slide smaller-or-equal elements one place to the right until the
         spot for PENDING opens up.  */
      while (slot > 0 && pending >= base[slot - 1])
        {
          base[slot] = base[slot - 1];

          if (base[slot] == pending)    /* Same position given twice.  */
            return 0;

          slot--;
        }

      base[slot] = pending;
    }

  return 1;
}
|
|
|
|
/* Dumps option status when debug is set. */
|
|
|
|
void
|
|
options_destroy ()
|
|
{
|
|
if (OPTION_ENABLED (option, DEBUG))
|
|
{
|
|
char *ptr;
|
|
|
|
fprintf (stderr, "\ndumping Options:\nDEBUG is.......: %s\nORDER is.......: %s\
|
|
\nANSI is........: %s\nTYPE is........: %s\nGNU is.........: %s\nRANDOM is......: %s\
|
|
\nDEFAULTCHARS is: %s\nSWITCH is......: %s\nPOINTER is.....: %s\nNOLENGTH is....: %s\
|
|
\nLENTABLE is....: %s\nDUP is.........: %s\nCOMP is........: %s\nFAST is........: %s\
|
|
\nNOTYPE is......: %s\nGLOBAL is......: %s\nCONST is.......: %s\niterations = %d\
|
|
\nlookup function name = %s\nhash function name = %s\nkey name = %s\
|
|
\njump value = %d\nmax associcated value = %d\ninitial associated value = %d\
|
|
\ndelimiters = %s\nnumber of switch statements = %d\napproximate switch statement size = %d\n",
|
|
OPTION_ENABLED (option, DEBUG) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, ORDER) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, ANSI) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, TYPE) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, GNU) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, RANDOM) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, DEFAULTCHARS) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, SWITCH) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, POINTER) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, NOLENGTH) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, LENTABLE) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, DUP) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, COMP) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, FAST) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, NOTYPE) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, GLOBAL) ? "enabled" : "disabled",
|
|
OPTION_ENABLED (option, CONST) ? "enabled" : "disabled",
|
|
option.iterations, option.function_name, option.hash_name,
|
|
option.key_name, option.jump, option.size - 1,
|
|
option.initial_asso_value, option.delimiters, option.total_switches,
|
|
keyword_list_length () / option.total_switches);
|
|
|
|
if (OPTION_ENABLED (option, ALLCHARS))
|
|
fprintf (stderr, "all characters are used in the hash function\n");
|
|
fprintf (stderr, "maximum charset size = %d\nkey positions are: \n",
|
|
option.total_charset_size);
|
|
|
|
for (ptr = option.key_positions; *ptr != EOS; ptr++)
|
|
if (*ptr == WORD_END)
|
|
fprintf (stderr, "$\n");
|
|
else
|
|
fprintf (stderr, "%d\n", *ptr);
|
|
|
|
fprintf (stderr, "finished dumping Options\n");
|
|
}
|
|
}
|
|
|
|
/* Parses the command line Options and sets appropriate flags in option.option_word. */
|
|
|
|
void
|
|
options_init (argc, argv)
|
|
int argc;
|
|
char *argv[];
|
|
{
|
|
extern int optind;
|
|
extern char *optarg;
|
|
int option_char;
|
|
|
|
option.key_positions[0] = WORD_START;
|
|
option.key_positions[1] = WORD_END;
|
|
option.key_positions[2] = EOS;
|
|
option.total_charset_size = 2;
|
|
option.jump = DEFAULT_JUMP_VALUE;
|
|
option.option_word = (int) DEFAULTCHARS;
|
|
option.function_name = DEFAULT_NAME;
|
|
option.hash_name = DEFAULT_HASH_NAME;
|
|
option.key_name = DEFAULT_KEY;
|
|
option.delimiters = DEFAULT_DELIMITERS;
|
|
option.initial_asso_value = option.size = option.iterations = 0;
|
|
option.total_switches = 1;
|
|
option.argument_count = argc;
|
|
option.argument_vector = argv;
|
|
set_program_name (argv[0]);
|
|
|
|
while ((option_char = getopt (argc, argv, "adcCDe:f:gGhH:i:j:k:K:lnN:oprs:S:tTv")) != EOF)
|
|
{
|
|
switch (option_char)
|
|
{
|
|
case 'a': /* Generated coded uses the ANSI prototype format. */
|
|
{
|
|
SET_OPTION (option, ANSI);
|
|
break;
|
|
}
|
|
case 'c': /* Generate strncmp rather than strcmp. */
|
|
{
|
|
SET_OPTION (option, COMP);
|
|
break;
|
|
}
|
|
case 'C': /* Make the generated tables readonly (const). */
|
|
{
|
|
SET_OPTION (option, CONST);
|
|
break;
|
|
}
|
|
case 'd': /* Enable debugging option. */
|
|
{
|
|
SET_OPTION (option, DEBUG);
|
|
report_error ("starting program %n, version %s, with debuggin on.\n",
|
|
version_string);
|
|
break;
|
|
}
|
|
case 'D': /* Enable duplicate option. */
|
|
{
|
|
SET_OPTION (option, DUP);
|
|
break;
|
|
}
|
|
case 'e': /* Allows user to provide keyword/attribute separator */
|
|
{
|
|
SET_DELIMITERS (option, optarg);
|
|
break;
|
|
}
|
|
case 'f': /* Generate the hash table ``fast.'' */
|
|
{
|
|
SET_OPTION (option, FAST);
|
|
if ((option.iterations = atoi (optarg)) < 0)
|
|
{
|
|
report_error ("iterations value must not be negative, assuming 0\n");
|
|
option.iterations = 0;
|
|
}
|
|
break;
|
|
}
|
|
case 'g': /* Use the ``inline'' keyword for generated sub-routines. */
|
|
{
|
|
SET_OPTION (option, GNU);
|
|
break;
|
|
}
|
|
case 'G': /* Make the keyword table a global variable. */
|
|
{
|
|
SET_OPTION (option, GLOBAL);
|
|
break;
|
|
}
|
|
case 'h': /* Displays a list of helpful Options to the user. */
|
|
{
|
|
report_error (
|
|
"-a\tGenerate ANSI standard C output code, i.e., function prototypes.\n\
|
|
-c\tGenerate comparison code using strncmp rather than strcmp.\n\
|
|
-C\tMake the contents of generated lookup tables constant, i.e., readonly.\n\
|
|
-d\tEnables the debugging option (produces verbose output to Std_Err).\n\
|
|
-D\tHandle keywords that hash to duplicate values. This is useful\n\
|
|
\tfor certain highly redundant keyword sets. It enables the -S option.\n\
|
|
-e\tAllow user to provide a string containing delimiters used to separate\n\
|
|
\tkeywords from their attributes. Default is \",\\n\"\n\
|
|
-f\tGenerate the perfect hash function ``fast.'' This decreases GPERF's\n\
|
|
\trunning time at the cost of minimizing generated table-size.\n\
|
|
\tThe numeric argument represents the number of times to iterate when\n\
|
|
\tresolving a collision. `0' means ``iterate by the number of keywords''.\n\
|
|
-g\tAssume a GNU compiler, e.g., g++ or gcc. This makes all generated\n\
|
|
\troutines use the ``inline'' keyword to remove cost of function calls.\n\
|
|
-G\tGenerate the static table of keywords as a static global variable,\n\
|
|
\trather than hiding it inside of the lookup function (which is the\n\
|
|
\tdefault behavior).\n\
|
|
-h\tPrints this mesage.\n");
|
|
report_error (
|
|
"-H\tAllow user to specify name of generated hash function. Default is `hash'.\n\
|
|
-i\tProvide an initial value for the associate values array. Default is 0.\n\
|
|
\tSetting this value larger helps inflate the size of the final table.\n\
|
|
-j\tAffects the ``jump value,'' i.e., how far to advance the associated\n\
|
|
\tcharacter value upon collisions. Must be an odd number, default is %d.\n\
|
|
-k\tAllows selection of the key positions used in the hash function.\n\
|
|
\tThe allowable choices range between 1-%d, inclusive. The positions\n\
|
|
\tare separated by commas, ranges may be used, and key positions may\n\
|
|
\toccur in any order. Also, the meta-character '*' causes the generated\n\
|
|
\thash function to consider ALL key positions, and $ indicates the\n\
|
|
\t``final character'' of a key, e.g., $,1,2,4,6-10.\n\
|
|
-K\tAllow user to select name of the keyword component in the keyword structure.\n\
|
|
-l\tCompare key lengths before trying a string comparison. This helps\n\
|
|
\tcut down on the number of string comparisons made during the lookup.\n\
|
|
-n\tDo not include the length of the keyword when computing the hash function\n\
|
|
-N\tAllow user to specify name of generated lookup function. Default\n\
|
|
\tname is `in_word_set.'\n\
|
|
-o\tReorders input keys by frequency of occurrence of the key sets.\n\
|
|
\tThis should decrease the search time dramatically.\n\
|
|
-p\tChanges the return value of the generated function ``in_word_set''\n\
|
|
\tfrom its default boolean value (i.e., 0 or 1), to type ``pointer\n\
|
|
\tto wordlist array'' This is most useful when the -t option, allowing\n\
|
|
\tuser-defined structs, is used.\n",
|
|
DEFAULT_JUMP_VALUE, MAX_KEY_POS - 1);
|
|
report_error (
|
|
"-r\tUtilizes randomness to initialize the associated values table.\n\
|
|
-s\tAffects the size of the generated hash table. The numeric argument\n\
|
|
\tfor this option indicates ``how many times larger'' the table range\n\
|
|
\tshould be, in relationship to the number of keys, e.g. a value of 3\n\
|
|
\tmeans ``make the table about 3 times larger than the number of input\n\
|
|
\tkeys.'' A larger table should decrease the time required for an\n\
|
|
\tunsuccessful search, at the expense of extra table space. Default\n\
|
|
\tvalue is 1. This actual table size may vary somewhat.\n\
|
|
-S\tCauses the generated C code to use a switch statement scheme, rather\n\
|
|
\tthan an array lookup table. This can lead to a reduction in both\n\
|
|
\ttime and space requirements for some keyfiles. The argument to\n\
|
|
\tthis option determines how many switch statements are generated.\n\
|
|
\tA value of 1 generates 1 switch containing all the elements, a value of 2\n\
|
|
\tgenerates 2 tables with 1/2 the elements in each table, etc. This\n\
|
|
\tis useful since many C compilers cannot correctly generate code for\n\
|
|
\tlarge switch statements.\n\
|
|
\tthe expense of longer time for each lookup. Mostly important for\n\
|
|
\t*large* input sets, i.e., greater than around 100 items or so.\n\
|
|
-t\tAllows the user to include a structured type declaration for \n\
|
|
\tgenerated code. Any text before %%%% is consider part of the type\n\
|
|
\tdeclaration. Key words and additional fields may follow this, one\n\
|
|
\tgroup of fields per line.\n\
|
|
-T\tPrevents the transfer of the type declaration to the output file.\n\
|
|
\tUse this option if the type is already defined elsewhere.\n\
|
|
-v\tPrints out the current version number\n%e%a\n",
|
|
usage);
|
|
}
|
|
case 'H': /* Sets the name for the hash function */
|
|
{
|
|
option.hash_name = optarg;
|
|
break;
|
|
}
|
|
case 'i': /* Sets the initial value for the associated values array. */
|
|
{
|
|
if ((option.initial_asso_value = atoi (optarg)) < 0)
|
|
report_error ("initial value %d must be non-zero, ignoring and continuing\n",
|
|
option.initial_asso_value);
|
|
if (OPTION_ENABLED (option, RANDOM))
|
|
report_error ("warning, -r option superceeds -i, ignoring -i option and continuing\n");
|
|
break;
|
|
}
|
|
case 'j': /* Sets the jump value, must be odd for later algorithms. */
|
|
{
|
|
if ((option.jump = atoi (optarg)) < 0)
|
|
report_error ("jump value %d must be a positive number\n%e%a",
|
|
option.jump, usage);
|
|
else if (option.jump && EVEN (option.jump))
|
|
report_error ("jump value %d should be odd, adding 1 and continuing...\n",
|
|
option.jump++);
|
|
break;
|
|
}
|
|
case 'k': /* Sets key positions used for hash function. */
|
|
{
|
|
int BAD_VALUE = -1;
|
|
int value;
|
|
|
|
iterator_init (optarg, 1, MAX_KEY_POS - 1, WORD_END, BAD_VALUE, EOS);
|
|
|
|
if (*optarg == '*') /* Use all the characters for hashing!!!! */
|
|
{
|
|
UNSET_OPTION (option, DEFAULTCHARS);
|
|
SET_OPTION (option, ALLCHARS);
|
|
}
|
|
else
|
|
{
|
|
char *key_pos;
|
|
|
|
for (key_pos = option.key_positions; (value = next ()) != EOS; key_pos++)
|
|
if (value == BAD_VALUE)
|
|
report_error ("illegal key value or range, use 1,2,3-%d,'$' or '*'.\n%e%a",
|
|
(MAX_KEY_POS - 1),usage);
|
|
else
|
|
*key_pos = value;;
|
|
|
|
*key_pos = EOS;
|
|
|
|
if (! (option.total_charset_size = (key_pos - option.key_positions)))
|
|
report_error ("no keys selected\n%e%a", usage);
|
|
else if (! key_sort (option.key_positions, option.total_charset_size))
|
|
report_error ("duplicate keys selected\n%e%a", usage);
|
|
|
|
if (option.total_charset_size != 2
|
|
|| (option.key_positions[0] != 1 || option.key_positions[1] != WORD_END))
|
|
UNSET_OPTION (option, DEFAULTCHARS);
|
|
}
|
|
break;
|
|
}
|
|
case 'K': /* Make this the keyname for the keyword component field. */
|
|
{
|
|
option.key_name = optarg;
|
|
break;
|
|
}
|
|
case 'l': /* Create length table to avoid extra string compares. */
|
|
{
|
|
SET_OPTION (option, LENTABLE);
|
|
break;
|
|
}
|
|
case 'n': /* Don't include the length when computing hash function. */
|
|
{
|
|
SET_OPTION (option, NOLENGTH);
|
|
break;
|
|
}
|
|
case 'N': /* Make generated lookup function name be optarg */
|
|
{
|
|
option.function_name = optarg;
|
|
break;
|
|
}
|
|
case 'o': /* Order input by frequency of key set occurrence. */
|
|
{
|
|
SET_OPTION (option, ORDER);
|
|
break;
|
|
}
|
|
case 'p': /* Generated lookup function now a pointer instead of int. */
|
|
{
|
|
SET_OPTION (option, POINTER);
|
|
break;
|
|
}
|
|
case 'r': /* Utilize randomness to initialize the associated values table. */
|
|
{
|
|
SET_OPTION (option, RANDOM);
|
|
if (option.initial_asso_value != 0)
|
|
report_error ("warning, -r option superceeds -i, disabling -i option and continuing\n");
|
|
break;
|
|
}
|
|
case 's': /* Range of associated values, determines size of final table. */
|
|
{
|
|
if ((option.size = atoi (optarg)) <= 0)
|
|
report_error ("improper range argument %s\n%e%a", optarg, usage);
|
|
else if (option.size > 50)
|
|
report_error ("%d is excessive, did you really mean this?! (type %n -h for help)\n",
|
|
option.size);
|
|
break;
|
|
}
|
|
case 'S': /* Generate switch statement output, rather than lookup table. */
|
|
{
|
|
SET_OPTION (option, SWITCH);
|
|
if ((option.total_switches = atoi (optarg)) <= 0)
|
|
report_error ("number of switches %s must be a positive number\n%e%a", optarg, usage);
|
|
break;
|
|
}
|
|
case 't': /* Enable the TYPE mode, allowing arbitrary user structures. */
|
|
{
|
|
SET_OPTION (option, TYPE);
|
|
break;
|
|
}
|
|
case 'T': /* Don't print structure definition. */
|
|
{
|
|
SET_OPTION (option, NOTYPE);
|
|
break;
|
|
}
|
|
case 'v': /* Print out the version and quit. */
|
|
report_error ("%n: version %s\n%e%a\n", version_string, usage);
|
|
default:
|
|
report_error ("%e%a", usage);
|
|
}
|
|
}
|
|
|
|
if (argv[optind] && ! freopen (argv[optind], "r", stdin))
|
|
report_error ("unable to read key word file %s\n%e%a", argv[optind], usage);
|
|
|
|
if (++optind < argc)
|
|
report_error ("extra trailing arguments to %n\n%e%a", usage);
|
|
}
|
|
|
|
/* Output command-line Options. */
|
|
void
|
|
print_options ()
|
|
{
|
|
int i;
|
|
|
|
printf ("/* Command-line: ");
|
|
|
|
for (i = 0; i < option.argument_count; i++)
|
|
printf ("%s ", option.argument_vector[i]);
|
|
|
|
printf (" */\n\n");
|
|
}
|
|
|