diff options
| author | Francesco Potortì <pot@gnu.org> | 1999-11-01 02:48:57 +0000 | 
|---|---|---|
| committer | Francesco Potortì <pot@gnu.org> | 1999-11-01 02:48:57 +0000 | 
| commit | 93b7ac65fc0e920bf11262f6b3eba4ae65c7a114 (patch) | |
| tree | db580d73a45abb863610aa6c3d0117a6d24abd2e /lib-src | |
| parent | 1c4784614ed4beda8e488308709c5486ea5740d8 (diff) | |
| download | emacs-93b7ac65fc0e920bf11262f6b3eba4ae65c7a114.tar.gz | |
Checked in at last a lot of improvementes and bug fixes.  The oldest dating
back to 1997-06-04.  Please look at Changelog for details.  Main changes
are:
- lots of code cleanups and optimizations
- --globals is used not only for C-like languages
- new option --ignore-case-regex
- understands "operator" in C++
- support DOS file names by handling e.g. foo.cgz as if it were foo.c.gz.
- Fortran: no tags for "procedure"
- new option --declarations
- regular expressions can be read from a file
- regular expressions can be bound to a given language
- Ada and Python languages added
- my and local variables recognised in Perl
- "(defstruct (foo", "(defun (operator" and similar Lisp constructs
- interface in Java
Diffstat (limited to 'lib-src')
| -rw-r--r-- | lib-src/etags.c | 2404 | 
1 files changed, 1492 insertions, 912 deletions
| diff --git a/lib-src/etags.c b/lib-src/etags.c index 83a9f65f6ca..165c298f0da 100644 --- a/lib-src/etags.c +++ b/lib-src/etags.c @@ -31,11 +31,12 @@ Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */   *	Francesco Potorti` (F.Potorti@cnuce.cnr.it) is the current maintainer.   */ -char pot_etags_version[] = "@(#) pot revision number is 12.11"; +char pot_etags_version[] = "@(#) pot revision number is 13.31";  #define	TRUE	1  #define	FALSE	0 +#define _GNU_SOURCE		/* enables some compiler checks on GNU */  #ifndef DEBUG  # define DEBUG FALSE  #endif @@ -45,14 +46,18 @@ char pot_etags_version[] = "@(#) pot revision number is 12.11";    /* On some systems, Emacs defines static as nothing for the sake       of unexec.  We don't want that here since we don't use unexec. */  # undef static -# define ETAGS_REGEXPS -# define LONG_OPTIONS -#endif +# define ETAGS_REGEXPS		/* use the regexp features */ +# define LONG_OPTIONS		/* accept long options */ +#endif /* HAVE_CONFIG_H */  #ifdef MSDOS -# include <string.h>  # include <fcntl.h>  # include <sys/param.h> +# include <io.h> +# ifndef HAVE_CONFIG_H +#   define DOS_NT +#   include <sys/config.h> +# endif  #endif /* MSDOS */  #ifdef WINDOWSNT @@ -61,27 +66,38 @@ char pot_etags_version[] = "@(#) pot revision number is 12.11";  # include <string.h>  # include <io.h>  # define MAXPATHLEN _MAX_PATH -#endif - -#if !defined (MSDOS) && !defined (WINDOWSNT) && defined (STDC_HEADERS) +# ifdef HAVE_CONFIG_H +#   undef HAVE_NTGUI +# else +#   define DOS_NT +# endif /* not HAVE_CONFIG_H */ +# ifndef HAVE_GETCWD +#   define HAVE_GETCWD +# endif /* undef HAVE_GETCWD */ +#endif /* WINDOWSNT */ + +#if !defined (WINDOWSNT) && defined (STDC_HEADERS)  #include <stdlib.h>  #include <string.h>  #endif +#ifdef HAVE_UNISTD_H +# include <unistd.h> +#else +# ifdef HAVE_GETCWD +    extern char *getcwd (); +# endif +#endif /* HAVE_UNISTD_H */ +  #include <stdio.h>  #include <ctype.h>  #include <errno.h>  #ifndef errno -extern int errno; +  extern int errno;  #endif  #include <sys/types.h>  #include <sys/stat.h> -/* This is to declare getcwd.  */ -#ifdef HAVE_UNISTD_H -#include <unistd.h> -#endif -  #if !defined (S_ISREG) && defined (S_IFREG)  # define S_ISREG(m)	(((m) & S_IFMT) == S_IFREG)  #endif @@ -131,62 +147,55 @@ extern int errno;  #define lowcase(c)	tolower ((char)c)  #define CHARS 256		/* 2^sizeof(char) */ -#define CHAR(x)		((int)x & (CHARS - 1)) +#define CHAR(x)		((unsigned int)x & (CHARS - 1))  #define	iswhite(c)	(_wht[CHAR(c)]) /* c is white */  #define notinname(c)	(_nin[CHAR(c)]) /* c is not in a name */  #define	begtoken(c)	(_btk[CHAR(c)]) /* c can start token */  #define	intoken(c)	(_itk[CHAR(c)]) /* c can be in token */  #define	endtoken(c)	(_etk[CHAR(c)]) /* c ends tokens */ -#ifdef DOS_NT -# define absolutefn(fn) (fn[0] == '/' \ -			 || (fn[1] == ':' && fn[2] == '/')) -#else -# define absolutefn(fn) (fn[0] == '/') -#endif -  /* - *	xnew -- allocate storage + *	xnew, xrnew -- allocate, reallocate storage   *   * SYNOPSIS:	Type *xnew (int n, Type); + *		Type *xrnew (OldPointer, int n, Type);   */  #ifdef chkmalloc  # include "chkmalloc.h" -# define xnew(n,Type)	((Type *) trace_xmalloc (__FILE__, __LINE__, \ -						 (n) * sizeof (Type))) +# define xnew(n,Type)	  ((Type *) trace_malloc (__FILE__, __LINE__, \ +						  (n) * sizeof (Type))) +# define xrnew(op,n,Type) ((Type *) trace_realloc (__FILE__, __LINE__, \ +						   (op), (n) * sizeof (Type)))  #else -# define xnew(n,Type)	((Type *) xmalloc ((n) * sizeof (Type))) +# define xnew(n,Type)	  ((Type *) xmalloc ((n) * sizeof (Type))) +# define xrnew(op,n,Type) ((Type *) xrealloc ((op), (n) * sizeof (Type)))  #endif  typedef int bool; -typedef struct nd_st -{				/* sorting structure		*/ -  char *name;			/* function or type name	*/ -  char *file;			/* file name			*/ -  bool is_func;			/* use pattern or line no	*/ -  bool been_warned;		/* set if noticed dup		*/ -  int lno;			/* line number tag is on	*/ -  long cno;			/* character number line starts on */ -  char *pat;			/* search pattern		*/ -  struct nd_st *left, *right;	/* left and right sons		*/ -} NODE; +typedef void Lang_function (); -extern char *getenv (); +typedef struct +{ +  char *suffix; +  char *command;		/* Takes one arg and decompresses to stdout */ +} compressor; -char *concat (); -char *savenstr (), *savestr (); -char *etags_strchr (), *etags_strrchr (); -char *etags_getcwd (); -char *relative_filename (), *absolute_filename (), *absolute_dirname (); -void grow_linebuffer (); -long *xmalloc (), *xrealloc (); +typedef struct +{ +  char *name; +  Lang_function *function; +  char **suffixes; +  char **interpreters; +} language; + +extern char *getenv (); -typedef void Lang_function ();  /* Many compilers barf on this: -	Lang_function Asm_labels; +	Lang_function Ada_funcs;     so let's write it this way */ +void Ada_funcs ();  void Asm_labels ();  void C_entries ();  void default_C_entries (); @@ -203,81 +212,111 @@ void Pascal_functions ();  void Perl_functions ();  void Postscript_functions ();  void Prolog_functions (); +void Python_functions ();  void Scheme_functions ();  void TeX_functions ();  void just_read_file (); -Lang_function *get_language_from_name (); -Lang_function *get_language_from_interpreter (); -Lang_function *get_language_from_suffix (); +compressor *get_compressor_from_suffix (); +language *get_language_from_name (); +language *get_language_from_interpreter (); +language *get_language_from_suffix ();  int total_size_of_entries (); -long readline (); -long readline_internal (); +long readline (), readline_internal (); +void get_tag (); +  #ifdef ETAGS_REGEXPS  void analyse_regex ();  void add_regex (); +void free_patterns ();  #endif /* ETAGS_REGEXPS */ -void add_node ();  void error ();  void suggest_asking_for_help ();  void fatal (), pfatal (); -void find_entries (); -void free_tree (); -void getit (); +void add_node (); +  void init ();  void initbuffer (); +void find_entries (); +void free_tree ();  void pfnote (), new_pfnote ();  void process_file ();  void put_entries ();  void takeprec (); +char *concat (); +char *skip_spaces (), *skip_non_spaces (); +char *savenstr (), *savestr (); +char *etags_strchr (), *etags_strrchr (); +char *etags_getcwd (); +char *relative_filename (), *absolute_filename (), *absolute_dirname (); +bool filename_is_absolute (); +void canonicalize_filename (); +void grow_linebuffer (); +long *xmalloc (), *xrealloc (); +  char searchar = '/';		/* use /.../ searches */ -int lineno;			/* line number of current line */ -long charno;			/* current character number */ -long linecharno;		/* charno of start of line */ - -char *curfile;			/* current input file name */  char *tagfile;			/* output file */  char *progname;			/* name this program was invoked with */  char *cwd;			/* current working directory */  char *tagfiledir;		/* directory of tagfile */ -  FILE *tagf;			/* ioptr for tags file */ -NODE *head;			/* the head of the binary tree of tags */ + +char *curfile;			/* current input file name */ +language *curlang;		/* current language */ + +int lineno;			/* line number of current line */ +long charno;			/* current character number */ +long linecharno;		/* charno of start of current line */ +char *dbp;			/* pointer to start of current tag */ + +typedef struct node_st +{				/* sorting structure		*/ +  char *name;			/* function or type name	*/ +  char *file;			/* file name			*/ +  bool is_func;			/* use pattern or line no	*/ +  bool been_warned;		/* set if noticed dup		*/ +  int lno;			/* line number tag is on	*/ +  long cno;			/* character number line starts on */ +  char *pat;			/* search pattern		*/ +  struct node_st *left, *right;	/* left and right sons		*/ +} node; + +node *head;			/* the head of the binary tree of tags */  /* - * A `struct linebuffer' is a structure which holds a line of text. - * `readline' reads a line from a stream into a linebuffer and works - * regardless of the length of the line. + * A `linebuffer' is a structure which holds a line of text. + * `readline_internal' reads a line from a stream into a linebuffer + * and works regardless of the length of the line.   * SIZE is the size of BUFFER, LEN is the length of the string in   * BUFFER after readline reads it.   */ -struct linebuffer +typedef struct  {    long size;    int len;    char *buffer; -}; +} linebuffer; -struct linebuffer lb;		/* the current line */ -struct linebuffer token_name;	/* used by C_entries as a temporary area */ +linebuffer lb;			/* the current line */ +linebuffer token_name;		/* used by C_entries as a temporary area */  struct  {    long linepos; -  struct linebuffer lb;		/* used by C_entries instead of lb */ +  linebuffer lb;		/* used by C_entries instead of lb */  } lbs[2];  /* boolean "functions" (see init)	*/  bool _wht[CHARS], _nin[CHARS], _itk[CHARS], _btk[CHARS], _etk[CHARS];  char    /* white chars */ -  *white = " \f\t\n\013", +  *white = " \f\t\n\r",    /* not in a name */ -  *nonam =" \f\t\n\013(=,[;", +  *nonam = " \f\t\n\r(=,[;",    /* token ending chars */ -  *endtk = " \t\n\013\"'#()[]{}=-+%*/&|^~!<>;,.:?", +  *endtk = " \t\n\r\"'#()[]{}=-+%*/&|^~!<>;,.:?",    /* token starting chars */    *begtk = "ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz$~@",    /* valid in-token chars */ @@ -285,14 +324,15 @@ char  bool append_to_tagfile;		/* -a: append to tags */  /* The following four default to TRUE for etags, but to FALSE for ctags.  */ -bool typedefs;			/* -t: create tags for C typedefs */ +bool typedefs;			/* -t: create tags for C and Ada typedefs */  bool typedefs_and_cplusplus;	/* -T: create tags for C typedefs, level */  				/* 0 struct/enum/union decls, and C++ */  				/* member functions. */  bool constantypedefs;		/* -d: create tags for C #define, enum */  				/* constants and variables. */  				/* -D: opposite of -d.  Default under ctags. */ -bool globals;			/* create tags for C global variables */ +bool declarations;		/* --declarations: tag them and extern in C&Co*/ +bool globals;			/* create tags for global variables */  bool members;			/* create tags for C member variables */  bool update;			/* -u: update tags */  bool vgrind_style;		/* -v: create vgrind style index output */ @@ -300,64 +340,87 @@ bool no_warnings;		/* -w: suppress warnings */  bool cxref_style;		/* -x: create cxref style output */  bool cplusplus;			/* .[hc] means C++, not C */  bool noindentypedefs;		/* -I: ignore indentation in C */ +bool packages_only;		/* --packages-only: in Ada, only tag packages*/  #ifdef LONG_OPTIONS  struct option longopts[] =  { -  { "append",			no_argument,	   NULL,     'a'   }, -  { "backward-search",		no_argument,	   NULL,     'B'   }, -  { "c++",			no_argument,	   NULL,     'C'   }, -  { "cxref",			no_argument,	   NULL,     'x'   }, -  { "defines",			no_argument,	   NULL,     'd'   }, -  { "no-defines",		no_argument,	   NULL,     'D'   }, -  { "globals",			no_argument,	   &globals, TRUE  }, -  { "no-globals",		no_argument,	   &globals, FALSE }, -  { "help",			no_argument,	   NULL,     'h'   }, -  { "help",			no_argument,	   NULL,     'H'   }, -  { "ignore-indentation",	no_argument,	   NULL,     'I'   }, -  { "include",			required_argument, NULL,     'i'   }, -  { "language",                 required_argument, NULL,     'l'   }, -  { "members",			no_argument,	   &members, TRUE  }, -  { "no-members",		no_argument,	   &members, FALSE }, -  { "no-warn",			no_argument,	   NULL,     'w'   }, -  { "output",			required_argument, NULL,     'o'   }, -#ifdef ETAGS_REGEXPS   -  { "regex",			required_argument, NULL,     'r'   }, -  { "no-regex",			no_argument,	   NULL,     'R'   }, -#endif /* ETAGS_REGEXPS */   -  { "typedefs",			no_argument,	   NULL,     't'   }, -  { "typedefs-and-c++",		no_argument,	   NULL,     'T'   }, -  { "update",			no_argument,	   NULL,     'u'   }, -  { "version",			no_argument,	   NULL,     'V'   }, -  { "vgrind",			no_argument,	   NULL,     'v'   }, -  { 0 } +  { "packages-only",      no_argument,	     &packages_only, TRUE  }, +  { "append",		  no_argument,	     NULL,	     'a'   }, +  { "backward-search",	  no_argument,	     NULL,	     'B'   }, +  { "c++",		  no_argument,	     NULL,	     'C'   }, +  { "cxref",		  no_argument,	     NULL,	     'x'   }, +  { "defines",		  no_argument,	     NULL,	     'd'   }, +  { "declarations",	  no_argument,	     &declarations,  TRUE  }, +  { "no-defines",	  no_argument,	     NULL,	     'D'   }, +  { "globals",		  no_argument,	     &globals, 	     TRUE  }, +  { "no-globals",	  no_argument,	     &globals, 	     FALSE }, +  { "help",		  no_argument,	     NULL,     	     'h'   }, +  { "help",		  no_argument,	     NULL,     	     'H'   }, +  { "ignore-indentation", no_argument,	     NULL,     	     'I'   }, +  { "include",		  required_argument, NULL,     	     'i'   }, +  { "language",           required_argument, NULL,     	     'l'   }, +  { "members",		  no_argument,	     &members, 	     TRUE  }, +  { "no-members",	  no_argument,	     &members, 	     FALSE }, +  { "no-warn",		  no_argument,	     NULL,	     'w'   }, +  { "output",		  required_argument, NULL,	     'o'   }, +#ifdef ETAGS_REGEXPS +  { "regex",		  required_argument, NULL,	     'r'   }, +  { "no-regex",		  no_argument,	     NULL,	     'R'   }, +  { "ignore-case-regex",  required_argument, NULL,	     'c'   }, +#endif /* ETAGS_REGEXPS */ +  { "typedefs",		  no_argument,	     NULL,	     't'   }, +  { "typedefs-and-c++",	  no_argument,	     NULL,     	     'T'   }, +  { "update",		  no_argument,	     NULL,     	     'u'   }, +  { "version",		  no_argument,	     NULL,     	     'V'   }, +  { "vgrind",		  no_argument,	     NULL,     	     'v'   }, +  { NULL }  };  #endif /* LONG_OPTIONS */  #ifdef ETAGS_REGEXPS  /* Structure defining a regular expression.  Elements are     the compiled pattern, and the name string. */ -struct pattern +typedef struct pattern  { +  struct pattern *p_next; +  language *language; +  char *regex;    struct re_pattern_buffer *pattern;    struct re_registers regs;    char *name_pattern;    bool error_signaled; -}; +} pattern; -/* Number of regexps found. */ -int num_patterns = 0; +/* List of all regexps. */ +pattern *p_head = NULL; -/* Array of all regexps. */ -struct pattern *patterns = NULL; +/* How many characters in the character set.  (From regex.c.)  */ +#define CHAR_SET_SIZE 256 +/* Translation table for case-insensitive matching. */ +char lc_trans[CHAR_SET_SIZE];  #endif /* ETAGS_REGEXPS */ +compressor compressors[] = +{ +  { "z", "gzip -d -c"}, +  { "Z", "gzip -d -c"}, +  { "gz", "gzip -d -c"}, +  { "GZ", "gzip -d -c"}, +  { "bz2", "bzip2 -d -c" }, +  { NULL } +}; +  /*   * Language stuff.   */  /* Non-NULL if language fixed. */ -Lang_function *lang_func = NULL; +language *forced_lang = NULL; + +/* Ada code */ +char *Ada_suffixes [] = +  { "ads", "adb", "ada", NULL };  /* Assembly code */  char *Asm_suffixes [] = { "a",	/* Unix assembler */ @@ -415,14 +478,17 @@ char *plain_C_suffixes [] =       NULL };  char *Postscript_suffixes [] = -  { "ps", NULL }; +  { "ps", "psw", NULL };	/* .psw is for PSWrap */  char *Prolog_suffixes [] =    { "prolog", NULL }; +char *Python_suffixes [] = +  { "py", NULL }; +  /* Can't do the `SCM' or `scm' prefix with a version number. */  char *Scheme_suffixes [] = -  { "SCM", "SM", "oak", "sch", "scheme", "scm", "sm", "t", NULL }; +  { "SCM", "SM", "oak", "sch", "scheme", "scm", "sm", "ss", "t", NULL };  char *TeX_suffixes [] =    { "TeX", "bib", "clo", "cls", "ltx", "sty", "tex", NULL }; @@ -430,20 +496,16 @@ char *TeX_suffixes [] =  char *Yacc_suffixes [] =    { "y", "ym", "yy", "yxx", "y++", NULL }; /* .ym is Objective yacc file */ -/* Table of language names and corresponding functions, file suffixes -   and interpreter names. -   It is ok for a given function to be listed under more than one -   name.  I just didn't. */ -struct lang_entry -{ -  char *name; -  Lang_function *function; -  char **suffixes; -  char **interpreters; -}; +/* + * Table of languages. + * + * It is ok for a given function to be listed under more than one + * name.  I just didn't. + */ -struct lang_entry lang_names [] = +language lang_names [] =  { +  { "ada",     Ada_funcs,           Ada_suffixes,         NULL              },    { "asm",     Asm_labels,          Asm_suffixes,         NULL              },    { "c",       default_C_entries,   default_C_suffixes,   NULL              },    { "c++",     Cplusplus_entries,   Cplusplus_suffixes,   NULL              }, @@ -458,6 +520,7 @@ struct lang_entry lang_names [] =    { "postscript", Postscript_functions, Postscript_suffixes, NULL           },    { "proc",    plain_C_entries,     plain_C_suffixes,     NULL              },    { "prolog",  Prolog_functions,    Prolog_suffixes,      NULL              }, +  { "python",  Python_functions,    Python_suffixes,      NULL              },    { "scheme",  Scheme_functions,    Scheme_suffixes,      NULL              },    { "tex",     TeX_functions,       TeX_suffixes,         NULL              },    { "yacc",    Yacc_entries,        Yacc_suffixes,        NULL              }, @@ -465,12 +528,11 @@ struct lang_entry lang_names [] =    { "none", just_read_file },   /* regexp matching only */    { NULL, NULL }                /* end of list */  }; -  void  print_language_names ()  { -  struct lang_entry *lang; +  language *lang;    char **ext;    puts ("\nThese are the currently supported languages, along with the\n\ @@ -488,11 +550,12 @@ name suffix, and `none' means only do regexp processing on files.\n\  If no language is specified and no matching suffix is found,\n\  the first line of the file is read for a sharp-bang (#!) sequence\n\  followed by the name of an interpreter.  If no such sequence is found,\n\ -Fortran is tried first; if no tags are found, C is tried next."); +Fortran is tried first; if no tags are found, C is tried next.\n\ +Compressed files are supported using gzip and bzip2.");  }  #ifndef VERSION -# define VERSION "19" +# define VERSION "20"  #endif  void  print_version () @@ -516,15 +579,18 @@ These are the options accepted by %s.\n", progname, progname);    puts ("Long option names do not work with this executable, as it is not\n\  linked with GNU getopt.");  #endif /* LONG_OPTIONS */ -  puts ("A - as file name means read names from stdin."); +  puts ("A - as file name means read names from stdin (one per line).");    if (!CTAGS) -    printf ("  Absolute names are stored in the output file as they\n\ -are.  Relative ones are stored relative to the output file's directory."); +    printf ("  Absolute names are stored in the output file as they are.\n\ +Relative ones are stored relative to the output file's directory.");    puts ("\n");    puts ("-a, --append\n\          Append tag entries to existing tags file."); +  puts ("--packages-only\n\ +        For Ada files, only generate tags for packages ."); +    if (CTAGS)      puts ("-B, --backward-search\n\          Write the search commands for the tag entries using '?', the\n\ @@ -533,6 +599,14 @@ are.  Relative ones are stored relative to the output file's directory.");    puts ("-C, --c++\n\          Treat files whose name suffix defaults to C language as C++ files."); +  puts ("--declarations\n\ +	In C and derived languages, create tags for function declarations,"); +  if (CTAGS) +    puts ("\tand create tags for extern variables if --globals is used."); +  else +    puts +      ("\tand create tags for extern variables unless --no-globals is used."); +    if (CTAGS)      puts ("-d, --defines\n\          Create tag entries for C #define constants and enum constants, too."); @@ -554,22 +628,25 @@ are.  Relative ones are stored relative to the output file's directory.");    if (CTAGS)      puts ("--globals\n\ -	Create tag entries for global variables in C and derived languages."); +	Create tag entries for global variables in some languages.");    else      puts ("--no-globals\n\ -	Do not create tag entries for global variables in C and\n\ -	derived languages.  This makes the tags file smaller."); +	Do not create tag entries for global variables in some\n\ +	languages.  This makes the tags file smaller.");    puts ("--members\n\  	Create tag entries for member variables in C and derived languages.");  #ifdef ETAGS_REGEXPS    puts ("-r /REGEXP/, --regex=/REGEXP/ or --regex=@regexfile\n\ -        Make a tag for each line matching pattern REGEXP in the\n\ - 	following files.  regexfile is a file containing one REGEXP\n\ -	per line.  REGEXP is anchored (as if preceded by ^).\n\ -	The form /REGEXP/NAME/ creates a named tag.  For example Tcl\n\ -	named tags can be created with:\n\ +        Make a tag for each line matching pattern REGEXP in the following\n\ + 	files.  {LANGUAGE}/REGEXP/ uses REGEXP for LANGUAGE files only.\n\ +	regexfile is a file containing one REGEXP per line.\n\ +	REGEXP is anchored (as if preceded by ^).\n\ +	The form /REGEXP/NAME/ creates a named tag.\n\ +	For example Tcl named tags can be created with:\n\  	--regex=/proc[ \\t]+\\([^ \\t]+\\)/\\1/."); +  puts ("-c /REGEXP/, --ignore-case-regex=/REGEXP/ or --ignore-case-regex=@regexfile\n\ +        Like -r, --regex but ignore case when matching expressions.");    puts ("-R, --no-regex\n\          Don't create tags from regexps for the following files.");  #endif /* ETAGS_REGEXPS */ @@ -584,7 +661,7 @@ are.  Relative ones are stored relative to the output file's directory.");    if (CTAGS)      {        puts ("-t, --typedefs\n\ -        Generate tag entries for C typedefs."); +        Generate tag entries for C and Ada typedefs.");        puts ("-T, --typedefs-and-c++\n\          Generate tag entries for C typedefs, C struct/enum/union tags,\n\          and C++ member functions."); @@ -627,7 +704,8 @@ enum argument_type  {    at_language,    at_regexp, -  at_filename +  at_filename, +  at_icregexp  };  /* This structure helps us allow mixing of --lang and file names. */ @@ -635,7 +713,7 @@ typedef struct  {    enum argument_type arg_type;    char *what; -  Lang_function *function; +  language *lang;		/* language of the regexp */  } argument;  #ifdef VMS			/* VMS specific functions */ @@ -774,7 +852,7 @@ main (argc, argv)    char *this_file;    argument *argbuffer;    int current_arg, file_count; -  struct linebuffer filename_lb; +  linebuffer filename_lb;  #ifdef VMS    bool got_err;  #endif @@ -795,13 +873,16 @@ main (argc, argv)  #ifdef ETAGS_REGEXPS    /* Set syntax for regular expression routines. */ -  re_set_syntax (RE_SYNTAX_EMACS); +  re_set_syntax (RE_SYNTAX_EMACS | RE_INTERVALS); +  /* Translation table for case-insensitive search. */ +  for (i = 0; i < CHAR_SET_SIZE; i++) +    lc_trans[i] = lowcase (i);  #endif /* ETAGS_REGEXPS */    /*     * If etags, always find typedefs and structure tags.  Why not?     * Also default is to find macro constants, enum constants and -   * global variables.  +   * global variables.     */    if (!CTAGS)      { @@ -816,7 +897,7 @@ main (argc, argv)        char *optstring;  #ifdef ETAGS_REGEXPS -      optstring = "-aCdDf:Il:o:r:RStTi:BuvxwVhH"; +      optstring = "-aCdDf:Il:o:r:c:RStTi:BuvxwVhH";  #else        optstring = "-aCdDf:Il:o:StTi:BuvxwVhH";  #endif /* ETAGS_REGEXPS */ @@ -863,9 +944,15 @@ main (argc, argv)  	  noindentypedefs = TRUE;  	  break;  	case 'l': -	  argbuffer[current_arg].function = get_language_from_name (optarg); -	  argbuffer[current_arg].arg_type = at_language; -	  ++current_arg; +	  { +	    language *lang = get_language_from_name (optarg); +	    if (lang != NULL) +	      { +		argbuffer[current_arg].lang = lang; +		argbuffer[current_arg].arg_type = at_language; +		++current_arg; +	      } +	  }  	  break;  #ifdef ETAGS_REGEXPS  	case 'r': @@ -878,6 +965,11 @@ main (argc, argv)  	  argbuffer[current_arg].what = NULL;  	  ++current_arg;  	  break; +        case 'c': +	  argbuffer[current_arg].arg_type = at_icregexp; +	  argbuffer[current_arg].what = optarg; +	  ++current_arg; +	  break;  #endif /* ETAGS_REGEXPS */  	case 'V':  	  print_version (); @@ -972,11 +1064,14 @@ main (argc, argv)        switch (argbuffer[i].arg_type)  	{  	case at_language: -	  lang_func = argbuffer[i].function; +	  forced_lang = argbuffer[i].lang;  	  break;  #ifdef ETAGS_REGEXPS  	case at_regexp: -	  analyse_regex (argbuffer[i].what); +	  analyse_regex (argbuffer[i].what, FALSE); +	  break; +	case at_icregexp: +	  analyse_regex (argbuffer[i].what, TRUE);  	  break;  #endif  	case at_filename: @@ -996,7 +1091,7 @@ main (argc, argv)  	      this_file = argbuffer[i].what;  #endif  	      /* Input file named "-" means read file names from stdin -		 and use them. */ +		 (one per line) and use them. */  	      if (streq (this_file, "-"))  		while (readline_internal (&filename_lb, stdin) > 0)  		  process_file (filename_lb.buffer); @@ -1009,6 +1104,10 @@ main (argc, argv)  	}      } +#ifdef ETAGS_REGEXPS +  free_patterns (); +#endif /* ETAGS_REGEXPS */ +    if (!CTAGS)      {        while (nincluded_files-- > 0) @@ -1023,6 +1122,8 @@ main (argc, argv)    if (cxref_style)      {        put_entries (head); +      free_tree (head); +      head = NULL;        exit (GOOD);      } @@ -1046,6 +1147,8 @@ main (argc, argv)    if (tagf == NULL)      pfatal (tagfile);    put_entries (head); +  free_tree (head); +  head = NULL;    fclose (tagf);    if (update) @@ -1058,41 +1161,81 @@ main (argc, argv)  } + +/* + * Return a compressor given the file name.  If EXTPTR is non-zero, + * return a pointer into FILE where the compressor-specific + * extension begins.  If no compressor is found, NULL is returned + * and EXTPTR is not significant. + * Idea by Vladimir Alexiev <vladimir@cs.ualberta.ca> + */ +compressor * +get_compressor_from_suffix (file, extptr) +     char *file; +     char **extptr; +{ +  compressor *compr; +  char *slash, *suffix; + +  /* This relies on FN to be after canonicalize_filename, +     so we don't need to consider backslashes on DOS_NT.  */ +  slash = etags_strrchr (file, '/'); +  suffix = etags_strrchr (file, '.'); +  if (suffix == NULL || suffix < slash) +    return NULL; +  if (extptr != NULL) +    *extptr = suffix; +  suffix += 1; +  /* Let those poor souls who live with DOS 8+3 file name limits get +     some solace by treating foo.cgz as if it were foo.c.gz, etc. +     Only the first do loop is run if not MSDOS */ +  do +    { +      for (compr = compressors; compr->suffix != NULL; compr++) +	if (streq (compr->suffix, suffix)) +	  return compr; +#ifndef MSDOS +      break; +#endif +      if (extptr != NULL) +	*extptr = ++suffix; +    } while (*suffix != '\0'); +  return NULL; +} + + +  /* - * Return a Lang_function given the name. + * Return a language given the name.   */ -Lang_function * +language *  get_language_from_name (name)       char *name;  { -  struct lang_entry *lang; +  language *lang; -  if (name != NULL) -    for (lang = lang_names; lang->name != NULL; lang++) -      { +  if (name == NULL) +    error ("empty language name", (char *)NULL); +  else +    { +      for (lang = lang_names; lang->name != NULL; lang++)  	if (streq (name, lang->name)) -	  return lang->function; -      } - -  error ("language \"%s\" not recognized.", optarg); -  suggest_asking_for_help (); +	  return lang; +      error ("unknown language \"%s\"", name); +    } -  /* This point should never be reached.  The function should either -     return a function pointer  or never return.  Note that a NULL -     pointer cannot be considered as an error, as it means that the -     language has not been explicitely imposed by the user ("auto"). */ -  return NULL;			/* avoid warnings from compiler */ +  return NULL;  }  /* - * Return a Lang_function given the interpreter name. + * Return a language given the interpreter name.   */ -Lang_function * +language *  get_language_from_interpreter (interpreter)       char *interpreter;  { -  struct lang_entry *lang; +  language *lang;    char **iname;    if (interpreter == NULL) @@ -1101,7 +1244,7 @@ get_language_from_interpreter (interpreter)      if (lang->interpreters != NULL)        for (iname = lang->interpreters; *iname != NULL; iname++)  	if (streq (*iname, interpreter)) -	    return lang->function; +	    return lang;    return NULL;  } @@ -1109,27 +1252,29 @@ get_language_from_interpreter (interpreter)  /* - * Return a Lang_function given the file suffix. + * Return a language given the file name.   */ -Lang_function * -get_language_from_suffix (suffix) -     char *suffix; +language * +get_language_from_suffix (file) +     char *file;  { -  struct lang_entry *lang; -  char **ext; +  language *lang; +  char **ext, *suffix; +  suffix = etags_strrchr (file, '.');    if (suffix == NULL)      return NULL; +  suffix += 1;    for (lang = lang_names; lang->name != NULL; lang++)      if (lang->suffixes != NULL)        for (ext = lang->suffixes; *ext != NULL; ext++)  	if (streq (*ext, suffix)) -	    return lang->function; - +	  return lang;    return NULL;  } +  /*   * This routine is called on each file argument.   */ @@ -1139,47 +1284,136 @@ process_file (file)  {    struct stat stat_buf;    FILE *inf; -#ifdef DOS_NT -  char *p; +  compressor *compr; +  char *compressed_name, *uncompressed_name; +  char *ext, *real_name; -  for (p = file; *p != '\0'; p++) -    if (*p == '\\') -      *p = '/'; -#endif -  if (stat (file, &stat_buf) == 0 && !S_ISREG (stat_buf.st_mode)) -    { -      error ("skipping %s: it is not a regular file.", file); -      return; -    } +  canonicalize_filename (file);    if (streq (file, tagfile) && !streq (tagfile, "-"))      {        error ("skipping inclusion of %s in self.", file);        return;      } -  inf = fopen (file, "r"); +  if ((compr = get_compressor_from_suffix (file, &ext)) == NULL) +    { +      compressed_name = NULL; +      real_name = uncompressed_name = savestr (file); +    } +  else +    { +      real_name = compressed_name = savestr (file); +      uncompressed_name = savenstr (file, ext - file); +    } + +  /* If the canonicalised uncompressed name has already be dealt with, +     skip it silently, else add it to the list. */ +  { +    typedef struct processed_file +    { +      char *filename; +      struct processed_file *next; +    } processed_file; +    static processed_file *pf_head = NULL; +    register processed_file *fnp; + +    for (fnp = pf_head; fnp != NULL; fnp = fnp->next) +      if (streq (uncompressed_name, fnp->filename)) +	goto exit; +    fnp = pf_head; +    pf_head = xnew (1, struct processed_file); +    pf_head->filename = savestr (uncompressed_name); +    pf_head->next = fnp; +  } + +  if (stat (real_name, &stat_buf) != 0) +    { +      /* Reset real_name and try with a different name. */ +      real_name = NULL; +      if (compressed_name != NULL) /* try with the given suffix */ +	{ +	  if (stat (uncompressed_name, &stat_buf) == 0) +	    real_name = uncompressed_name; +	} +      else			/* try all possible suffixes */ +	{ +	  for (compr = compressors; compr->suffix != NULL; compr++) +	    { +	      compressed_name = concat (file, ".", compr->suffix); +	      if (stat (compressed_name, &stat_buf) != 0) +		{ +#ifdef MSDOS +		  char *suf = compressed_name + strlen (file); +		  size_t suflen = strlen (compr->suffix) + 1; +		  for ( ; suf[1]; suf++, suflen--) +		    { +		      memmove (suf, suf + 1, suflen); +		      if (stat (compressed_name, &stat_buf) == 0) +			{ +			  real_name = compressed_name; +			  break; +			} +		    } +		  if (real_name != NULL) +		    break; +#endif +		  free (compressed_name); +		  compressed_name = NULL; +		} +	      else +		{ +		  real_name = compressed_name; +		  break; +		} +	    } +	} +      if (real_name == NULL) +	{ +	  perror (file); +	  goto exit; +	} +    } /* try with a different name */ + +  if (!S_ISREG (stat_buf.st_mode)) +    { +      error ("skipping %s: it is not a regular file.", real_name); +      goto exit; +    } +  if (real_name == compressed_name) +    { +      char *cmd = concat (compr->command, " ", real_name); +      inf = popen (cmd, "r"); +      free (cmd); +    } +  else +    inf = fopen (real_name, "r");    if (inf == NULL)      { -      perror (file); -      return; +      perror (real_name); +      goto exit;      } -  find_entries (file, inf); +  find_entries (uncompressed_name, inf); + +  if (real_name == compressed_name) +    pclose (inf); +  else +    fclose (inf);    if (!CTAGS)      {        char *filename; -      if (absolutefn (file)) +      if (filename_is_absolute (uncompressed_name))  	{  	  /* file is an absolute file name.  Canonicalise it. */ -	  filename = absolute_filename (file, cwd); +	  filename = absolute_filename (uncompressed_name, cwd);  	}        else  	{  	  /* file is a file name relative to cwd.  Make it relative  	     to the directory of the tags file. */ -	  filename = relative_filename (file, tagfiledir); +	  filename = relative_filename (uncompressed_name, tagfiledir);  	}        fprintf (tagf, "\f\n%s,%d\n", filename, total_size_of_entries (head));        free (filename); @@ -1187,11 +1421,16 @@ process_file (file)        free_tree (head);        head = NULL;      } + + exit: +  if (compressed_name) free(compressed_name); +  if (uncompressed_name) free(uncompressed_name); +  return;  }  /*   * This routine sets up the boolean pseudo-functions which work - * by setting boolean flags dependent upon the corresponding character + * by setting boolean flags dependent upon the corresponding character.   * Every char which is NOT in that string is not a white char.  Therefore,   * all of the array "_wht" is set to FALSE, and then the elements   * subscripted by the chars in "white" are set to TRUE.  Thus "_wht" @@ -1204,58 +1443,61 @@ init ()    register int i;    for (i = 0; i < CHARS; i++) -    _wht[i] = _nin[i] = _etk[i] = _itk[i] = _btk[i] = FALSE; -  for (sp = white; *sp; sp++) _wht[*sp] = TRUE;    _wht[0] = _wht['\n']; -  for (sp = nonam; *sp; sp++) _nin[*sp] = TRUE;    _nin[0] = _nin['\n']; -  for (sp = endtk; *sp; sp++) _etk[*sp] = TRUE;    _etk[0] = _etk['\n']; -  for (sp = midtk; *sp; sp++) _itk[*sp] = TRUE;    _btk[0] = _btk['\n']; -  for (sp = begtk; *sp; sp++) _btk[*sp] = TRUE;    _itk[0] = _itk['\n']; +    iswhite(i) = notinname(i) = begtoken(i) = intoken(i) = endtoken(i) = FALSE; +  for (sp = white; *sp != '\0'; sp++) iswhite (*sp) = TRUE; +  for (sp = nonam; *sp != '\0'; sp++) notinname (*sp) = TRUE; +  for (sp = begtk; *sp != '\0'; sp++) begtoken (*sp) = TRUE; +  for (sp = midtk; *sp != '\0'; sp++) intoken (*sp) = TRUE; +  for (sp = endtk; *sp != '\0'; sp++) endtoken (*sp) = TRUE; +  iswhite('\0') = iswhite('\n'); +  notinname('\0') = notinname('\n'); +  begtoken('\0') = begtoken('\n'); +  intoken('\0') = intoken('\n'); +  endtoken('\0') = endtoken('\n');  }  /*   * This routine opens the specified file and calls the function   * which finds the function and type definitions.   */ +node *last_node = NULL; +  void  find_entries (file, inf)       char *file;       FILE *inf;  {    char *cp; -  Lang_function *function; -  NODE *old_last_node; -  extern NODE *last_node; - - -  /* Memory leakage here: the memory block pointed by curfile is never -     released.  The amount of memory leaked here is the sum of the -     lengths of the input file names. */ +  language *lang; +  node *old_last_node; + +  /* Memory leakage here: the string pointed by curfile is +     never released, because curfile is copied into np->file +     for each node, to be used in CTAGS mode.  The amount of +     memory leaked here is the sum of the lengths of the +     file names. */    curfile = savestr (file);    /* If user specified a language, use it. */ -  function = lang_func; -  if (function != NULL) +  lang = forced_lang; +  if (lang != NULL && lang->function != NULL)      { -      function (inf); -      fclose (inf); +      curlang = lang; +      lang->function (inf);        return;      } -  cp = etags_strrchr (file, '.'); -  if (cp != NULL) +  /* Try to guess the language given the file name. */ +  lang = get_language_from_suffix (file); +  if (lang != NULL && lang->function != NULL)      { -      cp += 1; -      function = get_language_from_suffix (cp); -      if (function != NULL) -	{ -	  function (inf); -	  fclose (inf); -	  return; -	} +      curlang = lang; +      lang->function (inf); +      return;      }    /* Look for sharp-bang as the first two characters. */ -  if (readline_internal (&lb, inf) +  if (readline_internal (&lb, inf) > 0        && lb.len >= 2        && lb.buffer[0] == '#'        && lb.buffer[1] == '!') @@ -1269,36 +1511,40 @@ find_entries (file, inf)        if (lp != NULL)  	lp += 1;        else -	for (lp = lb.buffer+2; *lp != '\0' && isspace (*lp); lp++) -	  continue; -      for (cp = lp; *cp != '\0' && !isspace (*cp); cp++) -	continue; +	lp = skip_spaces (lb.buffer + 2); +      cp = skip_non_spaces (lp);        *cp = '\0';        if (strlen (lp) > 0)  	{ -	  function = get_language_from_interpreter (lp); -	  if (function != NULL) +	  lang = get_language_from_interpreter (lp); +	  if (lang != NULL && lang->function != NULL)  	    { -	      function (inf); -	      fclose (inf); +	      curlang = lang; +	      lang->function (inf);  	      return;  	    }  	}      } +  /* We rewind here, even if inf may be a pipe.  We fail if the +     length of the first line is longer than the pipe block size, +     which is unlikely. */    rewind (inf);    /* Try Fortran. */    old_last_node = last_node; +  curlang = get_language_from_name ("fortran");    Fortran_functions (inf);    /* No Fortran entries found.  Try C. */    if (old_last_node == last_node)      { +      /* We do not tag if rewind fails. +	 Only the file name will be recorded in the tags file. */        rewind (inf); +      curlang = get_language_from_name (cplusplus ? "c++" : "c");        default_C_entries (inf);      } -  fclose (inf);    return;  } @@ -1312,21 +1558,21 @@ pfnote (name, is_func, linestart, linelen, lno, cno)       int lno;			/* line number */       long cno;			/* character number */  { -  register NODE *np; +  register node *np;    if (CTAGS && name == NULL)      return; -  np = xnew (1, NODE); +  np = xnew (1, node);    /* If ctags mode, change name "main" to M<thisfilename>. */    if (CTAGS && !cxref_style && streq (name, "main"))      {        register char *fp = etags_strrchr (curfile, '/'); -      np->name = concat ("M", fp == 0 ? curfile : fp + 1, ""); +      np->name = concat ("M", fp == NULL ? curfile : fp + 1, "");        fp = etags_strrchr (np->name, '.'); -      if (fp && fp[1] != '\0' && fp[2] == '\0') -	fp[0] = 0; +      if (fp != NULL && fp[1] != '\0' && fp[2] == '\0') +	fp[0] = '\0';      }    else      np->name = name; @@ -1354,19 +1600,23 @@ pfnote (name, is_func, linestart, linelen, lno, cno)    add_node (np, &head);  } -/* Date: Wed, 22 Jan 1997 02:56:31 -0500 - * From: Sam Kendall <kendall@cybercom.net> +/* Date: Wed, 22 Jan 1997 02:56:31 -0500 [last amended 18 Sep 1997] + * From: Sam Kendall <kendall@mv.mv.com>   * Subject: Proposal for firming up the TAGS format specification   * To: F.Potorti@cnuce.cnr.it   *   * pfnote should emit the optimized form [unnamed tag] only if: - *  1. name does not contain any of the characters " \t\r\n()"; + *  1. name does not contain any of the characters " \t\r\n(),;";   *  2. linestart contains name as either a rightmost, or rightmost but   *     one character, substring;   *  3. the character, if any, immediately before name in linestart must - *     be one of the characters " \t()"; + *     be one of the characters " \t(),;";   *  4. the character, if any, immediately after name in linestart must - *     also be one of the characters " \t()". + *     also be one of the characters " \t(),;". + * + * The real implementation uses the notinname() macro, which recognises + * characters slightly different form " \t\r\n(),;".  See the variable + * `nonam'.   */  #define traditional_tag_style TRUE  void @@ -1399,7 +1649,7 @@ new_pfnote (name, namelen, is_func, linestart, linelen, lno, cno)  	    named = FALSE;	/* use unnamed tag */  	}      } -   +    if (named)      name = savenstr (name, namelen);    else @@ -1412,18 +1662,18 @@ new_pfnote (name, namelen, is_func, linestart, linelen, lno, cno)   *	recurse on left children, iterate on right children.   */  void -free_tree (node) -     register NODE *node; +free_tree (np) +     register node *np;  { -  while (node) +  while (np)      { -      register NODE *node_right = node->right; -      free_tree (node->left); -      if (node->name != NULL) -	free (node->name); -      free (node->pat); -      free ((char *) node); -      node = node_right; +      register node *node_right = np->right; +      free_tree (np->left); +      if (np->name != NULL) +	free (np->name); +      free (np->pat); +      free (np); +      np = node_right;      }  } @@ -1436,18 +1686,17 @@ free_tree (node)   *	add_node is the only function allowed to add nodes, so it can   *	maintain state.   */ -NODE *last_node = NULL;  void -add_node (node, cur_node_p) -     NODE *node, **cur_node_p; +add_node (np, cur_node_p) +     node *np, **cur_node_p;  {    register int dif; -  register NODE *cur_node = *cur_node_p; +  register node *cur_node = *cur_node_p;    if (cur_node == NULL)      { -      *cur_node_p = node; -      last_node = node; +      *cur_node_p = np; +      last_node = np;        return;      } @@ -1456,13 +1705,13 @@ add_node (node, cur_node_p)        /* Etags Mode */        if (last_node == NULL)  	fatal ("internal error in add_node", (char *)NULL); -      last_node->right = node; -      last_node = node; +      last_node->right = np; +      last_node = np;      }    else      {        /* Ctags Mode */ -      dif = strcmp (node->name, cur_node->name); +      dif = strcmp (np->name, cur_node->name);        /*         * If this tag name matches an existing one, then @@ -1470,12 +1719,12 @@ add_node (node, cur_node_p)         */        if (!dif)  	{ -	  if (streq (node->file, cur_node->file)) +	  if (streq (np->file, cur_node->file))  	    {  	      if (!no_warnings)  		{  		  fprintf (stderr, "Duplicate entry in file %s, line %d: %s\n", -			   node->file, lineno, node->name); +			   np->file, lineno, np->name);  		  fprintf (stderr, "Second entry ignored\n");  		}  	    } @@ -1484,64 +1733,64 @@ add_node (node, cur_node_p)  	      fprintf  		(stderr,  		 "Duplicate entry in files %s and %s: %s (Warning only)\n", -		 node->file, cur_node->file, node->name); +		 np->file, cur_node->file, np->name);  	      cur_node->been_warned = TRUE;  	    }  	  return;  	}        /* Actually add the node */ -      add_node (node, dif < 0 ? &cur_node->left : &cur_node->right); +      add_node (np, dif < 0 ? &cur_node->left : &cur_node->right);      }  }  void -put_entries (node) -     register NODE *node; +put_entries (np) +     register node *np;  {    register char *sp; -  if (node == NULL) +  if (np == NULL)      return;    /* Output subentries that precede this one */ -  put_entries (node->left); +  put_entries (np->left);    /* Output this entry */    if (!CTAGS)      { -      if (node->name != NULL) +      if (np->name != NULL)  	fprintf (tagf, "%s\177%s\001%d,%ld\n", -		 node->pat, node->name, node->lno, node->cno); +		 np->pat, np->name, np->lno, np->cno);        else  	fprintf (tagf, "%s\177%d,%ld\n", -		 node->pat, node->lno, node->cno); +		 np->pat, np->lno, np->cno);      }    else      { -      if (node->name == NULL) +      if (np->name == NULL)  	error ("internal error: NULL name in ctags mode.", (char *)NULL);        if (cxref_style)  	{  	  if (vgrind_style)  	    fprintf (stdout, "%s %s %d\n", -		     node->name, node->file, (node->lno + 63) / 64); +		     np->name, np->file, (np->lno + 63) / 64);  	  else  	    fprintf (stdout, "%-16s %3d %-16s %s\n", -		     node->name, node->lno, node->file, node->pat); +		     np->name, np->lno, np->file, np->pat);  	}        else  	{ -	  fprintf (tagf, "%s\t%s\t", node->name, node->file); +	  fprintf (tagf, "%s\t%s\t", np->name, np->file); -	  if (node->is_func) +	  if (np->is_func)  	    {			/* a function */  	      putc (searchar, tagf);  	      putc ('^', tagf); -	      for (sp = node->pat; *sp; sp++) +	      for (sp = np->pat; *sp; sp++)  		{  		  if (*sp == '\\' || *sp == searchar)  		    putc ('\\', tagf); @@ -1551,14 +1800,14 @@ put_entries (node)  	    }  	  else  	    {			/* a typedef; text pattern inadequate */ -	      fprintf (tagf, "%d", node->lno); +	      fprintf (tagf, "%d", np->lno);  	    }  	  putc ('\n', tagf);  	}      }    /* Output subentries that follow this one */ -  put_entries (node->right); +  put_entries (np->right);  }  /* Length of a number's decimal representation. */ @@ -1566,11 +1815,9 @@ int  number_len (num)       long num;  { -  int len = 0; -  if (!num) -    return 1; -  for (; num; num /= 10) -    ++len; +  int len = 1; +  while ((num /= 10) > 0) +    len += 1;    return len;  } @@ -1582,25 +1829,24 @@ number_len (num)   * backward compatibility.   */  int -total_size_of_entries (node) -     register NODE *node; +total_size_of_entries (np) +     register node *np;  {    register int total; -  if (node == NULL) +  if (np == NULL)      return 0; -  total = 0; -  for (; node; node = node->right) +  for (total = 0; np != NULL; np = np->right)      {        /* Count left subentries. */ -      total += total_size_of_entries (node->left); +      total += total_size_of_entries (np->left);        /* Count this entry */ -      total += strlen (node->pat) + 1; -      total += number_len ((long) node->lno) + 1 + number_len (node->cno) + 1; -      if (node->name != NULL) -	total += 1 + strlen (node->name);	/* \001name */ +      total += strlen (np->pat) + 1; +      total += number_len ((long) np->lno) + 1 + number_len (np->cno) + 1; +      if (np->name != NULL) +	total += 1 + strlen (np->name);	/* \001name */      }    return total; @@ -1616,7 +1862,8 @@ enum sym_type    st_C_gnumacro,    st_C_ignore,    st_C_javastruct, -  st_C_struct, st_C_enum, st_C_define, st_C_typedef, st_C_typespec +  st_C_operator, +  st_C_struct, st_C_extern, st_C_enum, st_C_define, st_C_typedef, st_C_typespec  };  /* Feed stuff between (but not including) %[ and %] lines to: @@ -1624,6 +1871,11 @@ enum sym_type  %[  struct C_stab_entry { char *name; int c_ext; enum sym_type type; }  %% +if,		0,	st_C_ignore +for,		0,	st_C_ignore +while,		0,	st_C_ignore +switch,		0,	st_C_ignore +return,		0,	st_C_ignore  @interface,	0,	st_C_objprot  @protocol,	0,	st_C_objprot  @implementation,0,	st_C_objimpl @@ -1633,14 +1885,17 @@ package,	C_JAVA,	st_C_ignore  friend,		C_PLPL,	st_C_ignore  extends,  	C_JAVA,	st_C_javastruct  implements,  	C_JAVA,	st_C_javastruct +interface,	C_JAVA, st_C_struct  class,  	C_PLPL,	st_C_struct  namespace,	C_PLPL,	st_C_struct  domain, 	C_STAR,	st_C_struct  union,  	0,	st_C_struct  struct, 	0,	st_C_struct +extern,  	0,	st_C_extern  enum,    	0,	st_C_enum  typedef, 	0,	st_C_typedef  define,  	0,	st_C_define +operator,	C_PLPL, st_C_operator  bool,		C_PLPL,	st_C_typespec  long,    	0,	st_C_typespec  short,   	0,	st_C_typespec @@ -1652,7 +1907,6 @@ signed,  	0,	st_C_typespec  unsigned,	0,	st_C_typespec  auto,    	0,	st_C_typespec  void,    	0,	st_C_typespec -extern,  	0,	st_C_typespec  static,  	0,	st_C_typespec  const,   	0,	st_C_typespec  volatile,	0,	st_C_typespec @@ -1671,137 +1925,168 @@ PSEUDO,		0,	st_C_gnumacro  %]  and replace lines between %< and %> with its output. */  /*%<*/ -/* starting time is 10:31:16 */ -/* C code produced by gperf version 2.1 (K&R C version) */ +/* C code produced by gperf version 2.7.1 (19981006 egcs) */  /* Command-line: gperf -c -k 1,3 -o -p -r -t  */ - -  struct C_stab_entry { char *name; int c_ext; enum sym_type type; }; -#define MIN_WORD_LENGTH 3 +#define TOTAL_KEYWORDS 46 +#define MIN_WORD_LENGTH 2  #define MAX_WORD_LENGTH 15 -#define MIN_HASH_VALUE 15 -#define MAX_HASH_VALUE 128 -/* -   39 keywords -  114 is the maximum key range -*/ +#define MIN_HASH_VALUE 13 +#define MAX_HASH_VALUE 123 +/* maximum key range = 111, duplicates = 0 */ -static int +#ifdef __GNUC__ +__inline +#endif +static unsigned int  hash (str, len) -     register char *str; -     register unsigned int  len; +     register const char *str; +     register unsigned int len;  { -  static unsigned char hash_table[] = +  static unsigned char asso_values[] =      { -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128, 128, 128, 128, -     128, 128, 128, 128,  39, 128, 128, 128,  54,  48, -      46, 128, 128, 128, 128, 128, 128, 128, 128, 128, -      28, 128, 128,  40,  32, 128, 128, 128, 128, 128, -     128, 128, 128, 128, 128, 128, 128,  24,  30,  47, -      62,   7,  60,  27, 128,  60, 128, 128,  59,  16, -      31,  23,  45, 128,   4,  14,   2,  55,   5, 128, -     128, 128, 128, 128, 128, 128, 128, 128, -  }; -  return len + hash_table[str[2]] + hash_table[str[0]]; +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124,   3, 124, 124, 124,  43,   6, +       11, 124, 124, 124, 124, 124, 124, 124, 124, 124, +       11, 124, 124,  58,   7, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124,  57,   7,  42, +        4,  14,  52,   0, 124,  53, 124, 124,  29,  11, +        6,  35,  32, 124,  29,  34,  59,  58,  51,  24, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124, 124, 124, 124, 124, +      124, 124, 124, 124, 124, 124 +    }; +  register int hval = len; + +  switch (hval) +    { +      default: +      case 3: +        hval += asso_values[(unsigned char)str[2]]; +      case 2: +      case 1: +        hval += asso_values[(unsigned char)str[0]]; +        break; +    } +  return hval;  } +#ifdef __GNUC__ +__inline +#endif  struct C_stab_entry *  in_word_set (str, len) -     register char *str; +     register const char *str;       register unsigned int len;  { - -  static struct C_stab_entry  wordlist[] = +  static struct C_stab_entry wordlist[] =      { -      {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},  -      {"",}, {"",}, {"",}, {"",}, {"",}, {"",},  -      {"extern",   	0,	st_C_typespec}, -      {"extends",   	C_JAVA,	st_C_javastruct}, -      {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},  -      {"struct",  	0,	st_C_struct}, -      {"mutable", 	C_PLPL,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",},  -      {"auto",     	0,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},  -      {"",}, {"",},  -      {"short",    	0,	st_C_typespec}, -      {"",},  -      {"static",   	0,	st_C_typespec}, -      {"",}, {"",},  -      {"signed",   	0,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",},  -      {"@protocol", 	0,	st_C_objprot}, -      {"",},  -      {"typedef",  	0,	st_C_typedef}, -      {"typename", 	C_PLPL,	st_C_typespec}, -      {"namespace", 	C_PLPL,	st_C_struct}, -      {"bool", 		C_PLPL,	st_C_typespec}, -      {"",}, {"",},  -      {"explicit", 	C_PLPL,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",},  -      {"int",      	0,	st_C_typespec}, -      {"enum",     	0,	st_C_enum}, -      {"",}, {"",},  -      {"void",     	0,	st_C_typespec}, -      {"@implementation", 0,	st_C_objimpl}, -      {"",},  -      {"volatile", 	0,	st_C_typespec}, -      {"",},  -      {"@end", 		0,	st_C_objend}, -      {"char",     	0,	st_C_typespec}, -      {"class",   	C_PLPL,	st_C_struct}, -      {"unsigned", 	0,	st_C_typespec}, -      {"",}, {"",},  -      {"@interface", 	0,	st_C_objprot}, -      {"",},  -      {"PSEUDO", 		0,	st_C_gnumacro}, -      {"const",    	0,	st_C_typespec}, -      {"domain",  	C_STAR,	st_C_struct}, -      {"ENTRY", 		0,	st_C_gnumacro}, -      {"",},  -      {"SYSCALL", 	0,	st_C_gnumacro}, -      {"float",    	0,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",}, {"",},  -      {"long",     	0,	st_C_typespec}, -      {"",}, {"",}, {"",}, {"",},  -      {"package", 	C_JAVA,	st_C_ignore}, -      {"",}, {"",}, {"",}, {"",}, {"",},  -      {"DEFUN", 		0,	st_C_gnumacro}, -      {"",}, {"",}, {"",}, {"",}, {"",},  -      {"import", 		C_JAVA,	st_C_ignore}, -      {"",}, {"",}, {"",},  -      {"implements",   	C_JAVA,	st_C_javastruct}, -      {"",}, {"",}, {"",}, {"",},  -      {"union",   	0,	st_C_struct}, -      {"",}, {"",},  -      {"double",   	0,	st_C_typespec}, -      {"",}, {"",},  -      {"friend", 		C_PLPL,	st_C_ignore}, -      {"",},  -      {"define",   	0,	st_C_define}, +      {""}, {""}, {""}, {""}, {""}, {""}, {""}, {""}, {""}, +      {""}, {""}, {""}, {""}, +      {"@end",		0,	st_C_objend}, +      {""}, {""}, {""}, {""}, +      {"ENTRY",		0,	st_C_gnumacro}, +      {"@interface",	0,	st_C_objprot}, +      {""}, +      {"domain", 	C_STAR,	st_C_struct}, +      {""}, +      {"PSEUDO",		0,	st_C_gnumacro}, +      {""}, {""}, +      {"namespace",	C_PLPL,	st_C_struct}, +      {""}, {""}, +      {"@implementation",0,	st_C_objimpl}, +      {""}, {""}, {""}, {""}, {""}, {""}, {""}, {""}, {""}, +      {"long",    	0,	st_C_typespec}, +      {"signed",  	0,	st_C_typespec}, +      {"@protocol",	0,	st_C_objprot}, +      {""}, {""}, {""}, {""}, +      {"bool",		C_PLPL,	st_C_typespec}, +      {""}, {""}, {""}, {""}, {""}, {""}, +      {"const",   	0,	st_C_typespec}, +      {"explicit",	C_PLPL,	st_C_typespec}, +      {"if",		0,	st_C_ignore}, +      {""}, +      {"operator",	C_PLPL, st_C_operator}, +      {""}, +      {"DEFUN",		0,	st_C_gnumacro}, +      {""}, {""}, +      {"define",  	0,	st_C_define}, +      {""}, {""}, {""}, {""}, {""}, +      {"double",  	0,	st_C_typespec}, +      {"struct", 	0,	st_C_struct}, +      {""}, {""}, {""}, {""}, +      {"short",   	0,	st_C_typespec}, +      {""}, +      {"enum",    	0,	st_C_enum}, +      {"mutable",	C_PLPL,	st_C_typespec}, +      {""}, +      {"extern",  	0,	st_C_extern}, +      {"extends",  	C_JAVA,	st_C_javastruct}, +      {"package",	C_JAVA,	st_C_ignore}, +      {"while",		0,	st_C_ignore}, +      {""}, +      {"for",		0,	st_C_ignore}, +      {""}, {""}, {""}, +      {"volatile",	0,	st_C_typespec}, +      {""}, {""}, +      {"import",		C_JAVA,	st_C_ignore}, +      {"float",   	0,	st_C_typespec}, +      {"switch",		0,	st_C_ignore}, +      {"return",		0,	st_C_ignore}, +      {"implements",  	C_JAVA,	st_C_javastruct}, +      {""}, +      {"static",  	0,	st_C_typespec}, +      {"typedef", 	0,	st_C_typedef}, +      {"typename",	C_PLPL,	st_C_typespec}, +      {"unsigned",	0,	st_C_typespec}, +      {""}, {""}, +      {"char",    	0,	st_C_typespec}, +      {"class",  	C_PLPL,	st_C_struct}, +      {""}, {""}, {""}, +      {"void",    	0,	st_C_typespec}, +      {""}, {""}, +      {"friend",		C_PLPL,	st_C_ignore}, +      {""}, {""}, {""}, +      {"int",     	0,	st_C_typespec}, +      {"union",  	0,	st_C_struct}, +      {""}, {""}, {""}, +      {"auto",    	0,	st_C_typespec}, +      {"interface",	C_JAVA, st_C_struct}, +      {""}, +      {"SYSCALL",	0,	st_C_gnumacro}      };    if (len <= MAX_WORD_LENGTH && len >= MIN_WORD_LENGTH)      {        register int key = hash (str, len); -      if (key <= MAX_HASH_VALUE && key >= MIN_HASH_VALUE) +      if (key <= MAX_HASH_VALUE && key >= 0)          { -          register char *s = wordlist[key].name; +          register const char *s = wordlist[key].name; -          if (*s == *str && !strncmp (str + 1, s + 1, len - 1)) +          if (*str == *s && !strncmp (str + 1, s + 1, len - 1))              return &wordlist[key];          }      }    return 0;  } -/* ending time is 10:31:16 */  /*%>*/  enum sym_type @@ -1824,6 +2109,7 @@ C_symtype (str, len, c_ext)  enum  {    fvnone,			/* nothing seen */ +  foperator,			/* func: operator keyword seen (cplpl) */    fvnameseen,			/* function or variable name seen */    fstartlist,			/* func: just after open parenthesis */    finlist,			/* func: in parameter list */ @@ -1832,6 +2118,7 @@ enum    vignore			/* var-like: ignore until ';' */  } fvdef; +bool fvextern;			/* func or var: extern keyword seen; */   /*    * typedefs are recognized using a simple finite automaton. @@ -1840,7 +2127,8 @@ enum  enum  {    tnone,			/* nothing seen */ -  ttypedseen,			/* typedef keyword seen */ +  tkeyseen,			/* typedef keyword seen */ +  ttypeseen,			/* defined type seen */    tinbody,			/* inside typedef body */    tend,				/* just before typedef tag */    tignore			/* junk after typedef tag */ @@ -1919,9 +2207,9 @@ typedef struct    int lineno;    long linepos;    char *buffer; -} TOKEN; -TOKEN tok;			/* latest token read */ +} token; +token tok;			/* latest token read */  /*   * Set this to TRUE, and the next token considered is called a function. @@ -1948,11 +2236,6 @@ int methodlen;   *	*IS_FUNC gets TRUE iff the token is a function or #define macro   *	with args.  C_EXT is which language we are looking at.   * - *	In the future we will need some way to adjust where the end of - *	the token is; for instance, implementing the C++ keyword - *	`operator' properly will adjust the end of the token to be after - *	whatever follows `operator'. - *   * Globals   *	fvdef			IN OUT   *	structdef		IN OUT @@ -2018,20 +2301,20 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)        if (toktype == st_C_typedef)  	{  	  if (typedefs) -	    typdef = ttypedseen; +	    typdef = tkeyseen; +	  fvextern = FALSE;  	  fvdef = fvnone;  	  return FALSE;  	}        break; -    case ttypedseen: +    case tkeyseen:        switch (toktype)  	{  	case st_none:  	case st_C_typespec: -	  typdef = tend; -	  break;  	case st_C_struct:  	case st_C_enum: +	  typdef = ttypeseen;  	  break;  	}        /* Do not return here, so the structdef stuff has a chance. */ @@ -2063,10 +2346,9 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)        if (structdef == stagseen)          structdef = scolonseen;        return FALSE; -      break;      case st_C_struct:      case st_C_enum: -      if (typdef == ttypedseen +      if (typdef == tkeyseen  	  || (typedefs_and_cplusplus && cblev == 0 && structdef == snone))  	{  	  structdef = skeyseen; @@ -2087,16 +2369,14 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)        return TRUE;      } -  /* Avoid entering fvdef stuff if typdef is going on. */    if (typdef != tnone) -    { -      definedef = dnone; -      return FALSE; -    } +    definedef = dnone;    /* Detect GNU macros. -     DEFUN note for writers of emacs C code: +     Writers of emacs code are recommended to put the +     first two args of a DEFUN on the same line. +        The DEFUN macro, used in emacs C source code, has a first arg       that is a string (the lisp function name), and a second arg that       is a C function name.  Since etags skips strings, the second arg @@ -2106,8 +2386,7 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)       removing the initial 'F' character and substituting '-' for '_'.       Anyway, this assumes that the conventions of naming lisp       functions will never change.  Currently, this method is not -     implemented, so writers of emacs code are recommended to put the -     first two args of a DEFUN on the same line. */ +     implemented. */    if (definedef == dnone && toktype == st_C_gnumacro)      {        next_token_is_func = TRUE; @@ -2196,14 +2475,28 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)    /* A function, variable or enum constant? */    switch (toktype)      { +    case st_C_extern: +      fvextern = TRUE; +      /* FALLTHRU */      case st_C_typespec: -      if (fvdef != finlist && fvdef != fignore  && fvdef != vignore) -        fvdef = fvnone;		/* should be useless */ +      if (fvdef != finlist && fvdef != fignore && fvdef != vignore) +	fvdef = fvnone;		/* should be useless */        return FALSE;      case st_C_ignore: +      fvextern = FALSE;        fvdef = vignore;        return FALSE; +    case st_C_operator: +      fvdef = foperator; +      *is_func_or_var = TRUE; +      return TRUE;      case st_none: +      if ((c_ext & C_PLPL) && strneq (str+len-10, "::operator", 10)) +	{ +	  fvdef = foperator; +	  *is_func_or_var = TRUE; +	  return TRUE; +	}        if (constantypedefs && structdef == sinbody && structtype == st_C_enum)  	return TRUE;        if (fvdef == fvnone) @@ -2212,6 +2505,7 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)  	  *is_func_or_var = TRUE;  	  return TRUE;  	} +      break;      }    return FALSE; @@ -2221,7 +2515,7 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)   * C_entries ()   *	This routine finds functions, variables, typedefs,   * 	#define's, enum constants and struct/union/enum definitions in - * 	#C syntax and adds them to the list. + * 	C syntax and adds them to the list.   */  #define current_lb_is_new (newndx == curndx)  #define switch_line_buffers() (curndx = 1 - curndx) @@ -2233,7 +2527,7 @@ consider_token (str, len, c, c_ext, cblev, parlev, is_func_or_var)  #define othlinepos (lbs[1-curndx].linepos)  #define newlinepos (lbs[newndx].linepos) -#define CNL_SAVE_DEFINEDEF						\ +#define CNL_SAVE_DEFINEDEF()						\  do {									\    curlinepos = charno;							\    lineno++;								\ @@ -2244,9 +2538,9 @@ do {									\    newndx = curndx;							\  } while (0) -#define CNL								\ +#define CNL()								\  do {									\ -  CNL_SAVE_DEFINEDEF;							\ +  CNL_SAVE_DEFINEDEF();							\    if (savetok.valid)							\      {									\        tok = savetok;							\ @@ -2300,23 +2594,25 @@ C_entries (c_ext, inf)    int cblev;			/* current curly brace level */    int parlev;			/* current parenthesis level */    bool incomm, inquote, inchar, quotednl, midtoken; -  bool cplpl, cjava; -  TOKEN savetok;		/* token saved during preprocessor handling */ +  bool purec, cplpl, cjava; +  token savetok;		/* token saved during preprocessor handling */ +  tokoff = toklen = 0;		/* keep compiler quiet */    curndx = newndx = 0;    lineno = 0;    charno = 0;    lp = curlb.buffer;    *lp = 0; -  fvdef = fvnone; typdef = tnone; structdef = snone; -  definedef = dnone; objdef = onone; +  fvdef = fvnone; fvextern = FALSE; typdef = tnone; +  structdef = snone; definedef = dnone; objdef = onone;    next_token_is_func = yacc_rules = FALSE;    midtoken = inquote = inchar = incomm = quotednl = FALSE;    tok.valid = savetok.valid = FALSE;    cblev = 0;    parlev = 0; +  purec = !(c_ext & ~YACC);	/* no extensions (apart from possibly yacc) */    cplpl = (c_ext & C_PLPL) == C_PLPL;    cjava = (c_ext & C_JAVA) == C_JAVA;    if (cjava) @@ -2354,7 +2650,7 @@ C_entries (c_ext, inf)  	    case '\0':  	      /* Newlines inside comments do not end macro definitions in  		 traditional cpp. */ -	      CNL_SAVE_DEFINEDEF; +	      CNL_SAVE_DEFINEDEF ();  	      break;  	    }  	  continue; @@ -2370,7 +2666,7 @@ C_entries (c_ext, inf)  	      /* Newlines inside strings do not end macro definitions  		 in traditional cpp, even though compilers don't  		 usually accept them. */ -	      CNL_SAVE_DEFINEDEF; +	      CNL_SAVE_DEFINEDEF ();  	      break;  	    }  	  continue; @@ -2381,7 +2677,7 @@ C_entries (c_ext, inf)  	    {  	    case '\0':  	      /* Hmmm, something went wrong. */ -	      CNL; +	      CNL ();  	      /* FALLTHRU */  	    case '\'':  	      inchar = FALSE; @@ -2395,12 +2691,18 @@ C_entries (c_ext, inf)  	  case '"':  	    inquote = TRUE;  	    if (fvdef != finlist && fvdef != fignore && fvdef !=vignore) -	      fvdef = fvnone; +	      { +		fvextern = FALSE; +		fvdef = fvnone; +	      }  	    continue;  	  case '\'':  	    inchar = TRUE;  	    if (fvdef != finlist && fvdef != fignore && fvdef !=vignore) -	      fvdef = fvnone; +	      { +		fvextern = FALSE; +		fvdef = fvnone; +	      }  	    continue;  	  case '/':  	    if (*lp == '*') @@ -2421,7 +2723,7 @@ C_entries (c_ext, inf)  	      {  		/* entering or exiting rules section in yacc file */  		lp++; -		definedef = dnone; fvdef = fvnone; +		definedef = dnone; fvdef = fvnone; fvextern = FALSE;  		typdef = tnone; structdef = snone;  		next_token_is_func = FALSE;  		midtoken = inquote = inchar = incomm = quotednl = FALSE; @@ -2463,7 +2765,7 @@ C_entries (c_ext, inf)        if ((definedef != dnone  	   || (cblev == 0 && structdef != scolonseen)  	   || (cblev == 1 && cplpl && structdef == sinbody) -	   || (structdef == sinbody && structtype == st_C_enum)) +	   || (structdef == sinbody && purec))  	  && typdef != tignore  	  && definedef != dignorerest  	  && fvdef != finlist) @@ -2472,27 +2774,43 @@ C_entries (c_ext, inf)  	    {  	      if (endtoken (c))  		{ -		  if (c == ':' && cplpl && *lp == ':' && begtoken(*(lp + 1))) +		  bool funorvar = FALSE; + +		  if (c == ':' && cplpl && *lp == ':' && begtoken (lp[1]))  		    {  		      /*  		       * This handles :: in the middle, but not at the -		       * beginning of an identifier. +		       * beginning of an identifier.  Also, space-separated +		       * :: is not recognised.  		       */  		      lp += 2; -		      toklen += 3; +		      toklen += 2; +		      c = lp[-1]; +		      goto intoken;  		    }  		  else  		    { -		      bool funorvar = FALSE; -  		      if (yacc_rules  			  || consider_token (newlb.buffer + tokoff, toklen, c,  					     c_ext, cblev, parlev, &funorvar))  			{ +			  if (fvdef == foperator) +			    { +			      char *oldlp = lp; +			      lp = skip_spaces (lp-1); +			      if (*lp != '\0') +				lp += 1; +			      while (*lp != '\0' +				     && !isspace (*lp) && *lp != '(') +				lp += 1; +			      c = *lp++; +			      toklen += lp - oldlp; +			    }  			  tok.named = FALSE; -			  if (structdef == sinbody +			  if (!purec +			      && funorvar  			      && definedef == dnone -			      && funorvar) +			      && structdef == sinbody)  			    /* function or var defined in C++ class body */  			    {  			      int len = strlen (structtag) + qlen + toklen; @@ -2530,11 +2848,15 @@ C_entries (c_ext, inf)  				       newlb.buffer + tokoff, toklen);  			      token_name.buffer[toklen] = '\0';  			      token_name.len = toklen; -			      /* Name macros. */ +			      /* Name macros and members. */  			      tok.named = (structdef == stagseen +					   || typdef == ttypeseen  					   || typdef == tend  					   || (funorvar -					       && definedef == dignorerest)); +					       && definedef == dignorerest) +					   || (funorvar +					       && definedef == dnone +					       && structdef == sinbody));  			    }  			  tok.lineno = lineno;  			  tok.linelen = tokoff + toklen + 1; @@ -2544,6 +2866,7 @@ C_entries (c_ext, inf)  			  if (definedef == dnone  			      && (fvdef == fvnameseen +				  || fvdef == foperator  				  || structdef == stagseen  				  || typdef == tend  				  || objdef != onone)) @@ -2558,6 +2881,7 @@ C_entries (c_ext, inf)  		    }  		} /* if (endtoken (c)) */  	      else if (intoken (c)) +		intoken:  		{  		  toklen++;  		  continue; @@ -2633,6 +2957,7 @@ C_entries (c_ext, inf)  		  }  		break;  	      case fstartlist: +		fvextern = FALSE;  		fvdef = fvnone;  		break;  	      } @@ -2654,10 +2979,19 @@ C_entries (c_ext, inf)  	    case fignore:  	      break;  	    case fvnameseen: -	      if ((globals && cblev == 0) || (members && cblev == 1)) +	      if ((members && cblev == 1) +		  || (globals && cblev == 0 && (!fvextern || declarations)))  		make_C_tag (FALSE); /* a variable */ +	      fvextern = FALSE; +	      fvdef = fvnone; +	      tok.valid = FALSE; +	      break; +	    case flistseen: +	      if (declarations && (cblev == 0 || cblev == 1)) +		make_C_tag (TRUE); /* a function declaration */  	      /* FALLTHRU */  	    default: +	      fvextern = FALSE;  	      fvdef = fvnone;  	      /* The following instruction invalidates the token.  		 Probably the token should be invalidated in all @@ -2680,12 +3014,14 @@ C_entries (c_ext, inf)  	    }  	  switch (fvdef)  	    { +	    case foperator:  	    case finlist:  	    case fignore:  	    case vignore:  	      break;  	    case fvnameseen: -	      if ((globals && cblev == 0) || (members && cblev == 1)) +	      if ((members && cblev == 1) +		  || (globals && cblev == 0 && (!fvextern || declarations)))  		make_C_tag (FALSE); /* a variable */  	      break;  	    default: @@ -2705,12 +3041,14 @@ C_entries (c_ext, inf)  	    }  	  switch (fvdef)  	    { +	    case foperator:  	    case finlist:  	    case fignore:  	    case vignore:  	      break;  	    case fvnameseen: -	      if ((globals && cblev == 0) || (members && cblev == 1)) +	      if ((members && cblev == 1) +		  || (globals && cblev == 0 && (!fvextern || declarations)))  		make_C_tag (FALSE); /* a variable */  	      /* FALLTHRU */  	    default: @@ -2726,22 +3064,19 @@ C_entries (c_ext, inf)  	    objdef = oparenseen;  	  switch (fvdef)  	    { -	    case fvnone: -	      switch (typdef) -		{ -		case ttypedseen: -		case tend: -		  if (tok.valid && *lp != '*') -		    { -		      /* This handles constructs like: -			 typedef void OperatorFun (int fun); */ -		      make_C_tag (FALSE); -		      typdef = tignore; -		    } -		  break; -		} /* switch (typdef) */ -	      break;  	    case fvnameseen: +	      if (typdef == ttypeseen +		  && tok.valid +		  && *lp != '*' +		  && structdef != sinbody) +		{ +		  /* This handles constructs like: +		     typedef void OperatorFun (int fun); */ +		  make_C_tag (FALSE); +		  typdef = tignore; +		} +	      /* FALLTHRU */ +	    case foperator:  	      fvdef = fstartlist;  	      break;  	    case flistseen: @@ -2767,7 +3102,7 @@ C_entries (c_ext, inf)  		  fvdef = flistseen;  		  break;  		} -	      if (cblev == 0 && typdef == tend) +	      if (cblev == 0 && (typdef == tend))  		{  		  typdef = tignore;  		  make_C_tag (FALSE); /* a typedef */ @@ -2779,7 +3114,7 @@ C_entries (c_ext, inf)  	case '{':  	  if (definedef != dnone)  	    break; -	  if (typdef == ttypedseen) +	  if (typdef == ttypeseen)  	    typdef = tinbody;  	  switch (structdef)  	    { @@ -2858,12 +3193,14 @@ C_entries (c_ext, inf)  	    break;  	  switch (fvdef)  	    { +	    case foperator:  	    case finlist:  	    case fignore:  	    case vignore:  	      break;  	    case fvnameseen: -	      if ((globals && cblev == 0) || (members && cblev == 1)) +	      if ((members && cblev == 1) +		  || (globals && cblev == 0 && (!fvextern || declarations)))  		make_C_tag (FALSE); /* a variable */  	      /* FALLTHRU */  	    default: @@ -2882,9 +3219,17 @@ C_entries (c_ext, inf)  	case '^': case '!': case '<': case '>': case '.': case '?': case ']':  	  if (definedef != dnone)  	    break; -	  /* These surely cannot follow a function tag. */ -	  if (fvdef != finlist && fvdef != fignore && fvdef != vignore) -	    fvdef = fvnone; +	  /* These surely cannot follow a function tag in C. */ +	  switch (fvdef) +	    { +	    case foperator: +	    case finlist: +	    case fignore: +	    case vignore: +	      break; +	    default: +	      fvdef = fvnone; +	    }  	  break;  	case '\0':  	  if (objdef == otagseen) @@ -2894,9 +3239,9 @@ C_entries (c_ext, inf)  	    }  	  /* If a macro spans multiple lines don't reset its state. */  	  if (quotednl) -	    CNL_SAVE_DEFINEDEF; +	    CNL_SAVE_DEFINEDEF ();  	  else -	    CNL; +	    CNL ();  	  break;  	} /* switch (c) */ @@ -2954,9 +3299,33 @@ Yacc_entries (inf)    C_entries (YACC, inf);  } -/* Fortran parsing */ +/* A useful macro. */ +#define LOOP_ON_INPUT_LINES(file_pointer, line_buffer, char_pointer)	\ +  for (lineno = charno = 0;	/* loop initialization */		\ +       !feof (file_pointer)	/* loop test */				\ +       && (lineno++,		/* instructions at start of loop */	\ +	   linecharno = charno,						\ +	   charno += readline (&line_buffer, file_pointer),		\ +	   char_pointer = lb.buffer,					\ +	   TRUE);							\ +      ) + + +/* + * Read a file, but do no processing.  This is used to do regexp + * matching on files that have no language defined. + */ +void +just_read_file (inf) +     FILE *inf; +{ +  register char *dummy; -char *dbp; +  LOOP_ON_INPUT_LINES (inf, lb, dummy) +    continue; +} + +/* Fortran parsing */  bool  tail (cp) @@ -2964,9 +3333,9 @@ tail (cp)  {    register int len = 0; -  while (*cp && lowcase(*cp) == lowcase(dbp[len])) +  while (*cp != '\0' && lowcase (*cp) == lowcase (dbp[len]))      cp++, len++; -  if (*cp == '\0' && !intoken(dbp[len])) +  if (*cp == '\0' && !intoken (dbp[len]))      {        dbp += len;        return TRUE; @@ -2977,13 +3346,11 @@ tail (cp)  void  takeprec ()  { -  while (isspace (*dbp)) -    dbp++; +  dbp = skip_spaces (dbp);    if (*dbp != '*')      return;    dbp++; -  while (isspace (*dbp)) -    dbp++; +  dbp = skip_spaces (dbp);    if (strneq (dbp, "(*)", 3))      {        dbp += 3; @@ -3005,8 +3372,7 @@ getit (inf)  {    register char *cp; -  while (isspace (*dbp)) -    dbp++; +  dbp = skip_spaces (dbp);    if (*dbp == '\0')      {        lineno++; @@ -3016,39 +3382,26 @@ getit (inf)        if (dbp[5] != '&')  	return;        dbp += 6; -      while (isspace (*dbp)) -	dbp++; +      dbp = skip_spaces (dbp);      } -  if (!isalpha (*dbp) -      && *dbp != '_' -      && *dbp != '$') +  if (!isalpha (*dbp) && *dbp != '_' && *dbp != '$')      return; -  for (cp = dbp + 1; -       (*cp -	&& (isalpha (*cp) || isdigit (*cp) || (*cp == '_') || (*cp == '$'))); -       cp++) +  for (cp = dbp + 1; *cp != '\0' && intoken (*cp); cp++)      continue;    pfnote (savenstr (dbp, cp-dbp), TRUE,  	  lb.buffer, cp - lb.buffer + 1, lineno, linecharno);  } +  void  Fortran_functions (inf)       FILE *inf;  { -  lineno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, dbp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      dbp = lb.buffer;        if (*dbp == '%')  	dbp++;			/* Ratfor escape to fortran */ -      while (isspace (*dbp)) -	dbp++; +      dbp = skip_spaces (dbp);        if (*dbp == '\0')  	continue;        switch (lowcase (*dbp)) @@ -3072,8 +3425,7 @@ Fortran_functions (inf)  	case 'd':  	  if (tail ("double"))  	    { -	      while (isspace (*dbp)) -		dbp++; +	      dbp = skip_spaces (dbp);  	      if (*dbp == '\0')  		continue;  	      if (tail ("precision")) @@ -3082,8 +3434,7 @@ Fortran_functions (inf)  	    }  	  break;  	} -      while (isspace (*dbp)) -	dbp++; +      dbp = skip_spaces (dbp);        if (*dbp == '\0')  	continue;        switch (lowcase (*dbp)) @@ -3100,23 +3451,13 @@ Fortran_functions (inf)  	  if (tail ("entry"))  	    getit (inf);  	  continue; -	case 'p': -	  if (tail ("program")) -	    { -	      getit (inf); -	      continue; -	    } -	  if (tail ("procedure")) -	    getit (inf); -	  continue;  	case 'b':  	  if (tail ("blockdata") || tail ("block data"))  	    { -	      while (isspace (*dbp)) -		dbp++; +	      dbp = skip_spaces (dbp);  	      if (*dbp == '\0')	/* assume un-named */ -		pfnote (savestr ("blockdata"), TRUE, lb.buffer, -			dbp - lb.buffer, lineno, linecharno); +		pfnote (savestr ("blockdata"), TRUE, +			lb.buffer, dbp - lb.buffer, lineno, linecharno);  	      else  		getit (inf);	/* look for name */  	    } @@ -3126,6 +3467,171 @@ Fortran_functions (inf)  }  /* + * Philippe Waroquiers <philippe.waroquiers@eurocontrol.be>, 1998-04-24 + * Ada parsing + */ +/* Once we are positioned after an "interesting" keyword, let's get +   the real tag value necessary. */ +void +adagetit (inf, name_qualifier) +     FILE *inf; +     char *name_qualifier; +{ +  register char *cp; +  char *name; +  char c; + +  while (!feof (inf)) +    { +      dbp = skip_spaces (dbp); +      if (*dbp == '\0' +	  || (dbp[0] == '-' && dbp[1] == '-')) +	{ +	  lineno++; +	  linecharno = charno; +	  charno += readline (&lb, inf); +	  dbp = lb.buffer; +	} +      switch (*dbp) +        { +        case 'b': +        case 'B': +          if (tail ("body")) +            { +              /* Skipping body of   procedure body   or   package body or .... +		 resetting qualifier to body instead of spec. */ +              name_qualifier = "/b"; +              continue; +            } +          break; +        case 't': +        case 'T': +          /* Skipping type of   task type   or   protected type ... */ +          if (tail ("type")) +            continue; +          break; +        } +      if (*dbp == '"') +	{ +	  dbp += 1; +	  for (cp = dbp; *cp != '\0' && *cp != '"'; cp++) +	    continue; +	} +      else +	{ +	  dbp = skip_spaces (dbp); +	  for (cp = dbp; +	       (*cp != '\0' +		&& (isalpha (*cp) || isdigit (*cp) || *cp == '_' || *cp == '.')); +	       cp++) +	    continue; +	  if (cp == dbp) +	    return; +	} +      c = *cp; +      *cp = '\0'; +      name = concat (dbp, name_qualifier, ""); +      *cp = c; +      pfnote (name, TRUE, lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +      if (c == '"') +	dbp = cp + 1; +      return; +    } +} + +void +Ada_funcs (inf) +     FILE *inf; +{ +  bool inquote = FALSE; + +  LOOP_ON_INPUT_LINES (inf, lb, dbp) +    { +      while (*dbp != '\0') +	{ +	  /* Skip a string i.e. "abcd". */ +	  if (inquote || (*dbp == '"')) +	    { +	      dbp = etags_strchr ((inquote) ? dbp : dbp+1, '"'); +	      if (dbp != NULL) +		{ +		  inquote = FALSE; +		  dbp += 1; +		  continue;	/* advance char */ +		} +	      else +		{ +		  inquote = TRUE; +		  break;	/* advance line */ +		} +	    } + +	  /* Skip comments. */ +	  if (dbp[0] == '-' && dbp[1] == '-') +	    break;		/* advance line */ + +	  /* Skip character enclosed in single quote i.e. 'a' +	     and skip single quote starting an attribute i.e. 'Image. */ +	  if (*dbp == '\'') +	    { +	      dbp++ ; +	      if (*dbp != '\0') +		dbp++; +	      continue; +	    } + +	  /* Search for beginning of a token.  */ +	  if (!begtoken (*dbp)) +	    { +	      dbp++; +	      continue;		/* advance char */ +	    } + +	  /* We are at the beginning of a token. */ +	  switch (*dbp) +	    { +	    case 'f': +	    case 'F': +	      if (!packages_only && tail ("function")) +		adagetit (inf, "/f"); +	      else +		break;		/* from switch */ +	      continue;		/* advance char */ +	    case 'p': +	    case 'P': +	      if (!packages_only && tail ("procedure")) +		adagetit (inf, "/p"); +	      else if (tail ("package")) +		adagetit (inf, "/s"); +	      else if (tail ("protected")) /* protected type */ +		adagetit (inf, "/t"); +	      else +		break;		/* from switch */ +	      continue;		/* advance char */ +	    case 't': +	    case 'T': +	      if (!packages_only && tail ("task")) +		adagetit (inf, "/k"); +	      else if (typedefs && !packages_only && tail ("type")) +		{ +		  adagetit (inf, "/t"); +		  while (*dbp != '\0') +		    dbp += 1; +		} +	      else +		break;		/* from switch */ +	      continue;		/* advance char */ +	    } + +	  /* Look for the end of the token. */ +	  while (!endtoken (*dbp)) +	    dbp++; + +	} /* advance char */ +    } /* advance line */ +} + +/*   * Bob Weiner, Motorola Inc., 4/3/94   * Unix and microcontroller assembly tag handling   * look for '^[a-zA-Z_.$][a-zA_Z0-9_.$]*[: ^I^J]' @@ -3136,16 +3642,8 @@ Asm_labels (inf)  {    register char *cp; -  lineno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, cp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      cp = lb.buffer; -        /* If first char is alphabetic or one of [_.$], test for colon  	 following identifier. */        if (isalpha (*cp) || *cp == '_' || *cp == '.' || *cp == '$') @@ -3166,7 +3664,9 @@ Asm_labels (inf)  /*   * Perl support by Bart Robinson <lomew@cs.utah.edu> + *              enhanced by Michael Ernst <mernst@alum.mit.edu>   * Perl sub names: look for /^sub[ \t\n]+[^ \t\n{]+/ + * Perl variable names: /^(my|local).../   */  void  Perl_functions (inf) @@ -3174,23 +3674,96 @@ Perl_functions (inf)  {    register char *cp; -  lineno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, cp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      cp = lb.buffer; +      if (*cp++ == 's' +	  && *cp++ == 'u' +	  && *cp++ == 'b' && isspace (*cp++)) +	{ +	  cp = skip_spaces (cp); + 	  if (*cp != '\0') + 	    { +	      char *sp = cp; + 	      while (*cp != '\0' +		     && !isspace (*cp) && *cp != '{' && *cp != '(') +		cp++; +	      pfnote (savenstr (sp, cp-sp), TRUE, + 		      lb.buffer, cp - lb.buffer + 1, lineno, linecharno); + 	    } + 	} +       else if (globals		/* only if tagging global vars is enabled */ +		&& ((cp = lb.buffer, +		     *cp++ == 'm' +		     && *cp++ == 'y') +		    || (cp = lb.buffer, +			*cp++ == 'l' +			&& *cp++ == 'o' +			&& *cp++ == 'c' +			&& *cp++ == 'a' +			&& *cp++ == 'l')) +		&& (*cp == '(' || isspace (*cp))) + 	{ + 	  /* After "my" or "local", but before any following paren or space. */ + 	  char *varname = NULL; + + 	  cp = skip_spaces (cp); + 	  if (*cp == '$' || *cp == '@' || *cp == '%') + 	    { + 	      char* varstart = ++cp; + 	      while (isalnum (*cp) || *cp == '_') + 		cp++; + 	      varname = savenstr (varstart, cp-varstart); + 	    } + 	  else + 	    { + 	      /* Should be examining a variable list at this point; + 		 could insist on seeing an open parenthesis. */ + 	      while (*cp != '\0' && *cp != ';' && *cp != '=' &&  *cp != ')') + 		cp++; + 	    } + + 	  /* Perhaps I should back cp up one character, so the TAGS table + 	     doesn't mention (and so depend upon) the following char. */ + 	  pfnote ((CTAGS) ? savenstr (lb.buffer, cp-lb.buffer) : varname, + 		  FALSE, lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +	} +    } +} + +/* + * Python support by Eric S. Raymond <esr@thyrsus.com> + * Look for /^def[ \t\n]+[^ \t\n(:]+/ or /^class[ \t\n]+[^ \t\n(:]+/ + */ +void +Python_functions (inf) +     FILE *inf; +{ +  register char *cp; -      if (*cp++ == 's' && *cp++ == 'u' && *cp++ == 'b' && isspace (*cp++)) +  LOOP_ON_INPUT_LINES (inf, lb, cp) +    { +      if (*cp++ == 'd' +	  && *cp++ == 'e' +	  && *cp++ == 'f' && isspace (*cp++))  	{ -	  while (*cp && isspace (*cp)) +	  cp = skip_spaces (cp); +	  while (*cp != '\0' && !isspace (*cp) && *cp != '(' && *cp != ':')  	    cp++; -	  while (*cp && ! isspace (*cp) && *cp != '{') +	  pfnote (NULL, TRUE, +		  lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +	} + +      cp = lb.buffer; +      if (*cp++ == 'c' +	  && *cp++ == 'l' +	  && *cp++ == 'a' +	  && *cp++ == 's' +	  && *cp++ == 's' && isspace (*cp++)) +	{ +	  cp = skip_spaces (cp); +	  while (*cp != '\0' && !isspace (*cp) && *cp != '(' && *cp != ':')  	    cp++; -	  pfnote (savenstr (lb.buffer, cp-lb.buffer), TRUE, +	  pfnote (NULL, TRUE,  		  lb.buffer, cp - lb.buffer + 1, lineno, linecharno);  	}      } @@ -3205,30 +3778,23 @@ void  Cobol_paragraphs (inf)       FILE *inf;  { -  register char *cp; - -  lineno = 0; -  charno = 0; +  register char *bp, *ep; -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, bp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -        if (lb.len < 9)  	continue; -      dbp = lb.buffer + 8; +      bp += 8;        /* If eoln, compiler option or comment ignore whole line. */ -      if (dbp[-1] != ' ' || !isalnum (dbp[0])) +      if (bp[-1] != ' ' || !isalnum (bp[0]))          continue; -      for (cp = dbp; isalnum (*cp) || *cp == '-'; cp++) +      for (ep = bp; isalnum (*ep) || *ep == '-'; ep++)  	continue; -      if (*cp++ == '.') -	pfnote (savenstr (dbp, cp-dbp), TRUE, -		lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +      if (*ep++ == '.') +	pfnote (savenstr (bp, ep-bp), TRUE, +		lb.buffer, ep - lb.buffer + 1, lineno, linecharno);      }  } @@ -3245,7 +3811,7 @@ void  Pascal_functions (inf)       FILE *inf;  { -  struct linebuffer tline;	/* mostly copied from C_entries */ +  linebuffer tline;		/* mostly copied from C_entries */    long save_lcno;    int save_lineno, save_len;    char c, *cp, *namebuf; @@ -3262,11 +3828,12 @@ Pascal_functions (inf)  				   is a FORWARD/EXTERN to be ignored, or  				   whether it is a real tag */ +  save_lcno = save_lineno = save_len = 0; /* keep compiler quiet */ +  namebuf = NULL;		/* keep compiler quiet */    lineno = 0;    charno = 0;    dbp = lb.buffer;    *dbp = '\0'; -  save_len = 0;    initbuffer (&tline);    incomment = inquote = FALSE; @@ -3275,8 +3842,8 @@ Pascal_functions (inf)    inparms = FALSE;		/* found '(' after "proc"            */    verify_tag = FALSE;		/* check if "extern" is ahead        */ -  /* long main loop to get next char */ -  while (!feof (inf)) + +  while (!feof (inf))		/* long main loop to get next char */      {        c = *dbp++;        if (c == '\0')		/* if end of line */ @@ -3287,8 +3854,8 @@ Pascal_functions (inf)  	  dbp = lb.buffer;  	  if (*dbp == '\0')  	    continue; -	  if (!((found_tag && verify_tag) || -		get_tagname)) +	  if (!((found_tag && verify_tag) +		|| get_tagname))  	    c = *dbp++;		/* only if don't need *dbp pointing  				   to the beginning of the name of  				   the procedure or function */ @@ -3430,12 +3997,12 @@ int  L_isquote (strp)       register char *strp;  { -  return ((*(++strp) == 'q' || *strp == 'Q') -	  && (*(++strp) == 'u' || *strp == 'U') -	  && (*(++strp) == 'o' || *strp == 'O') -	  && (*(++strp) == 't' || *strp == 'T') -	  && (*(++strp) == 'e' || *strp == 'E') -	  && isspace (*(++strp))); +  return ((*++strp == 'q' || *strp == 'Q') +	  && (*++strp == 'u' || *strp == 'U') +	  && (*++strp == 'o' || *strp == 'O') +	  && (*++strp == 't' || *strp == 'T') +	  && (*++strp == 'e' || *strp == 'E') +	  && isspace (*++strp));  }  void @@ -3445,14 +4012,17 @@ L_getit ()    if (*dbp == '\'')		/* Skip prefix quote */      dbp++; -  else if (*dbp == '(' && L_isquote (dbp)) /* Skip "(quote " */ +  else if (*dbp == '(')    { -    dbp += 7; -    while (isspace (*dbp)) -      dbp++; +    if (L_isquote (dbp)) +      dbp += 7;			/* Skip "(quote " */ +    else +      dbp += 1;			/* Skip "(" before name in (defstruct (foo)) */ +    dbp = skip_spaces (dbp);    } +    for (cp = dbp /*+1*/; -       *cp != '\0' && *cp != '(' && *cp != ' ' && *cp != ')'; +       *cp != '\0' && *cp != '(' && !isspace(*cp) && *cp != ')';         cp++)      continue;    if (cp == dbp) @@ -3466,23 +4036,14 @@ void  Lisp_functions (inf)       FILE *inf;  { -  lineno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, dbp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      dbp = lb.buffer;        if (dbp[0] == '(')  	{  	  if (L_isdef (dbp))  	    { -	      while (!isspace (*dbp)) -		dbp++; -	      while (isspace (*dbp)) -		dbp++; +	      dbp = skip_non_spaces (dbp); +	      dbp = skip_spaces (dbp);  	      L_getit ();  	    }  	  else @@ -3490,7 +4051,7 @@ Lisp_functions (inf)  	      /* Check for (foo::defmumble name-defined ... */  	      do  		dbp++; -	      while (*dbp && !isspace (*dbp) +	      while (*dbp != '\0' && !isspace (*dbp)  		     && *dbp != ':' && *dbp != '(' && *dbp != ')');  	      if (*dbp == ':')  		{ @@ -3500,10 +4061,8 @@ Lisp_functions (inf)  		  if (L_isdef (dbp - 1))  		    { -		      while (!isspace (*dbp)) -			dbp++; -		      while (isspace (*dbp)) -			dbp++; +		      dbp = skip_non_spaces (dbp); +		      dbp = skip_spaces (dbp);  		      L_getit ();  		    }  		} @@ -3516,29 +4075,31 @@ Lisp_functions (inf)   * Postscript tag functions   * Just look for lines where the first character is '/'   * Richard Mlynarik <mly@adoc.xerox.com> + * Also look at "defineps" for PSWrap + * suggested by Masatake YAMATO <masata-y@is.aist-nara.ac.jp>   */ -void  +void  Postscript_functions (inf)       FILE *inf;  { -  lineno = 0; -  charno = 0; +  register char *bp, *ep; -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, bp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      dbp = lb.buffer; -      if (dbp[0] == '/') +      if (bp[0] == '/')  	{ -	  register char *cp; -	  for (cp = dbp+1; -	       *cp != '\0' && *cp != ' ' && *cp != '{'; -	       cp++) +	  for (ep = bp+1; +	       *ep != '\0' && *ep != ' ' && *ep != '{'; +	       ep++)  	    continue; -	  pfnote (savenstr (dbp, cp-dbp), TRUE, -		  lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +	  pfnote (savenstr (bp, ep-bp), TRUE, +		  lb.buffer, ep - lb.buffer + 1, lineno, linecharno); +	} +      else if (strneq (bp, "defineps", 8)) +	{ +	  bp = skip_non_spaces (bp); + 	  bp = skip_spaces (bp); +	  get_tag (bp);  	}      }  } @@ -3558,59 +4119,34 @@ void  Scheme_functions (inf)       FILE *inf;  { -  lineno = 0; -  charno = 0; +  register char *bp; -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, bp)      { -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      dbp = lb.buffer; -      if (dbp[0] == '(' && -	  (dbp[1] == 'D' || dbp[1] == 'd') && -	  (dbp[2] == 'E' || dbp[2] == 'e') && -	  (dbp[3] == 'F' || dbp[3] == 'f')) +      if (bp[0] == '(' +	  && (bp[1] == 'D' || bp[1] == 'd') +	  && (bp[2] == 'E' || bp[2] == 'e') +	  && (bp[3] == 'F' || bp[3] == 'f'))  	{ -	  while (!isspace (*dbp)) -	    dbp++; +	  bp = skip_non_spaces (bp);  	  /* Skip over open parens and white space */ -	  while (*dbp && (isspace (*dbp) || *dbp == '(')) -	    dbp++; -	  get_scheme (); +	  while (isspace (*bp) || *bp == '(') +	    bp++; +	  get_tag (bp);  	} -      if (dbp[0] == '(' && -	  (dbp[1] == 'S' || dbp[1] == 's') && -	  (dbp[2] == 'E' || dbp[2] == 'e') && -	  (dbp[3] == 'T' || dbp[3] == 't') && -	  (dbp[4] == '!' || dbp[4] == '!') && -	  (isspace (dbp[5]))) +      if (bp[0] == '(' +	  && (bp[1] == 'S' || bp[1] == 's') +	  && (bp[2] == 'E' || bp[2] == 'e') +	  && (bp[3] == 'T' || bp[3] == 't') +	  && (bp[4] == '!' || bp[4] == '!') +	  && (isspace (bp[5])))  	{ -	  while (!isspace (*dbp)) -	    dbp++; -	  /* Skip over white space */ -	  while (isspace (*dbp)) -	    dbp++; -	  get_scheme (); +	  bp = skip_non_spaces (bp); +	  bp = skip_spaces (bp); +	  get_tag (bp);  	}      }  } - -void -get_scheme () -{ -  register char *cp; - -  if (*dbp == '\0') -    return; -  /* Go till you get to white space or a syntactic break */ -  for (cp = dbp + 1; -       *cp && *cp != '(' && *cp != ')' && !isspace (*cp); -       cp++) -    continue; -  pfnote (savenstr (dbp, cp-dbp), TRUE, -	  lb.buffer, cp - lb.buffer + 1, lineno, linecharno); -}  /* Find tags in TeX and LaTeX input files.  */ @@ -3647,12 +4183,9 @@ void  TeX_functions (inf)       FILE *inf;  { -  char *lasthit; +  char *cp, *lasthit;    register int i; -  lineno = 0; -  charno = 0; -    /* Select either \ or ! as escape character.  */    TEX_mode (inf); @@ -3660,19 +4193,16 @@ TeX_functions (inf)    if (!TEX_toktab)      TEX_toktab = TEX_decode_env ("TEXTAGS", TEX_defenv); -  while (!feof (inf)) -    {				/* Scan each line in file */ -      lineno++; -      linecharno = charno; -      charno += readline (&lb, inf); -      dbp = lb.buffer; -      lasthit = dbp; -      while (dbp = etags_strchr (dbp, TEX_esc))	/* Look at each esc in line */ +  LOOP_ON_INPUT_LINES (inf, lb, cp) +    { +      lasthit = cp; +      /* Look at each esc in line. */ +      while ((cp = etags_strchr (cp, TEX_esc)) != NULL)  	{ -	  if (!*(++dbp)) +	  if (*++cp == '\0')  	    break; -	  linecharno += dbp - lasthit; -	  lasthit = dbp; +	  linecharno += cp - lasthit; +	  lasthit = cp;  	  i = TEX_Token (lasthit);  	  if (i >= 0)  	    { @@ -3724,6 +4254,8 @@ TEX_mode (inf)        TEX_opgrp = '<';        TEX_clgrp = '>';      } +  /* If the input file is compressed, inf is a pipe, and rewind may fail. +     No attempt is made to correct the situation. */    rewind (inf);  } @@ -3751,7 +4283,7 @@ TEX_decode_env (evarname, defenv)    /* Allocate a token table */    for (size = 1, p = env; p;) -    if ((p = etags_strchr (p, ':')) && *(++p)) +    if ((p = etags_strchr (p, ':')) && *++p != '\0')        size++;    /* Add 1 to leave room for null terminator.  */    tab = xnew (size + 1, struct TEX_tabent); @@ -3784,7 +4316,7 @@ TEX_decode_env (evarname, defenv)  /* If the text at CP matches one of the tag-defining TeX command names,     return the pointer to the first occurrence of that command in TEX_toktab.     Otherwise return -1. -   Keep the capital `T' in `Token' for dumb truncating compilers +   Keep the capital `T' in `token' for dumb truncating compilers     (this distinguishes it from `TEX_toktab' */  int  TEX_Token (cp) @@ -3802,18 +4334,17 @@ TEX_Token (cp)   * Prolog support (rewritten) by Anders Lindgren, Mar. 96   *   * Assumes that the predicate starts at column 0. - * Only the first clause of a predicate is added.  + * Only the first clause of a predicate is added.   */  int prolog_pred ();  void prolog_skip_comment ();  int prolog_atom (); -int eat_white ();  void  Prolog_functions (inf)       FILE *inf;  { -  char * last; +  char *cp, *last;    int len;    int allocated; @@ -3821,32 +4352,24 @@ Prolog_functions (inf)    len = 0;    last = NULL; -  lineno = 0; -  linecharno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, cp)      { -      lineno++; -      linecharno += charno; -      charno = readline (&lb, inf); -      dbp = lb.buffer; -      if (dbp[0] == '\0')	/* Empty line */ +      if (cp[0] == '\0')	/* Empty line */  	continue; -      else if (isspace (dbp[0])) /* Not a predicate */ +      else if (isspace (cp[0])) /* Not a predicate */  	continue; -      else if (dbp[0] == '/' && dbp[1] == '*')	/* comment. */ +      else if (cp[0] == '/' && cp[1] == '*')	/* comment. */  	prolog_skip_comment (&lb, inf); -      else if (len = prolog_pred (dbp, last))  +      else if ((len = prolog_pred (cp, last)) > 0)  	{  	  /* Predicate.  Store the function name so that we only  	     generate a tag for the first clause.  */  	  if (last == NULL)  	    last = xnew(len + 1, char);  	  else if (len + 1 > allocated) -	    last = (char *) xrealloc(last, len + 1); +	    last = xrnew (last, len + 1, char);  	  allocated = len + 1; -	  strncpy (last, dbp, len); +	  strncpy (last, cp, len);  	  last[len] = '\0';  	}      } @@ -3855,7 +4378,7 @@ Prolog_functions (inf)  void  prolog_skip_comment (plb, inf) -     struct linebuffer *plb; +     linebuffer *plb;       FILE *inf;  {    char *cp; @@ -3894,7 +4417,7 @@ prolog_pred (s, last)      return 0;    len = pos; -  pos += eat_white (s, pos); +  pos = skip_spaces (s + pos) - s;    if ((s[pos] == '(') || (s[pos] == '.'))      { @@ -3903,11 +4426,10 @@ prolog_pred (s, last)        /* Save only the first clause. */        if (last == NULL -	  || len != strlen (last) +	  || len != (int)strlen (last)  	  || !strneq (s, last, len))  	{ -	  pfnote (savenstr (s, len), TRUE, -		  s, pos, lineno, linecharno); +	  pfnote (savenstr (s, len), TRUE, s, pos, lineno, linecharno);  	  return len;  	}      } @@ -3946,7 +4468,7 @@ prolog_atom (s, pos)      {        pos++; -      while (1)  +      while (1)  	{  	  if (s[pos] == '\'')  	    { @@ -3972,24 +4494,8 @@ prolog_atom (s, pos)    else      return -1;  } - -/* Consume whitespace.  Return the number of bytes eaten. */ -int -eat_white (s, pos) -     char *s; -     int pos; -{ -  int origpos = pos; - -  origpos = pos; - -  while (isspace (s[pos])) -    pos++; - -  return pos - origpos; -} -/*  +/*   * Support for Erlang  --  Anders Lindgren, Feb 1996.   *   * Generates tags for functions, defines, and records. @@ -4004,7 +4510,7 @@ void  Erlang_functions (inf)       FILE *inf;  { -  char * last; +  char *cp, *last;    int len;    int allocated; @@ -4012,41 +4518,33 @@ Erlang_functions (inf)    len = 0;    last = NULL; -  lineno = 0; -  linecharno = 0; -  charno = 0; - -  while (!feof (inf)) +  LOOP_ON_INPUT_LINES (inf, lb, cp)      { -      lineno++; -      linecharno += charno; -      charno = readline (&lb, inf); -      dbp = lb.buffer; -      if (dbp[0] == '\0')	/* Empty line */ +      if (cp[0] == '\0')	/* Empty line */  	continue; -      else if (isspace (dbp[0])) /* Not function nor attribute */ +      else if (isspace (cp[0])) /* Not function nor attribute */  	continue; -      else if (dbp[0] == '%')	/* comment */ +      else if (cp[0] == '%')	/* comment */  	continue; -      else if (dbp[0] == '"')	/* Sometimes, strings start in column one */ +      else if (cp[0] == '"')	/* Sometimes, strings start in column one */  	continue; -      else if (dbp[0] == '-') 	/* attribute, e.g. "-define" */ +      else if (cp[0] == '-') 	/* attribute, e.g. "-define" */  	{ -	  erlang_attribute (dbp); +	  erlang_attribute (cp);  	  last = NULL;  	} -      else if (len = erlang_func (dbp, last))  +      else if ((len = erlang_func (cp, last)) > 0)  	{ -	  /*  +	  /*  	   * Function.  Store the function name so that we only  	   * generates a tag for the first clause.  	   */  	  if (last == NULL)  	    last = xnew (len + 1, char);  	  else if (len + 1 > allocated) -	    last = (char *) xrealloc (last, len + 1); +	    last = xrnew (last, len + 1, char);  	  allocated = len + 1; -	  strncpy (last, dbp, len); +	  strncpy (last, cp, len);  	  last[len] = '\0';  	}      } @@ -4076,16 +4574,15 @@ erlang_func (s, last)      return 0;    len = pos; -  pos += eat_white (s, pos); +  pos = skip_spaces (s + pos) - s;    /* Save only the first clause. */    if (s[pos++] == '('        && (last == NULL -	  || len != strlen (last) +	  || len != (int)strlen (last)  	  || !strneq (s, last, len)))  	{ -	  pfnote (savenstr (s, len), TRUE, -		  s, pos, lineno, linecharno); +	  pfnote (savenstr (s, len), TRUE, s, pos, lineno, linecharno);  	  return len;  	} @@ -4094,7 +4591,7 @@ erlang_func (s, last)  /* - * Handle attributes.  Currently, tags are generated for defines  + * Handle attributes.  Currently, tags are generated for defines   * and records.   *   * They are on the form: @@ -4111,13 +4608,14 @@ erlang_attribute (s)    if (strneq (s, "-define", 7) || strneq (s, "-record", 7))      { -      pos = 7 + eat_white (s, 7); -      if (s[pos++] == '(')  +      pos = skip_spaces (s + 7) - s; +      if (s[pos++] == '(')  	{ -	  pos += eat_white (s, pos); -	  if (len = erlang_atom (s, pos)) -	      pfnote (savenstr (& s[pos], len), TRUE, -		      s, pos + len, lineno, linecharno); +	  pos = skip_spaces (s + pos) - s; +	  len = erlang_atom (s, pos); +	  if (len != 0) +	    pfnote (savenstr (& s[pos], len), TRUE, +		    s, pos + len, lineno, linecharno);  	}      }    return; @@ -4149,7 +4647,7 @@ erlang_atom (s, pos)      {        pos++; -      while (1)  +      while (1)  	{  	  if (s[pos] == '\'')  	    { @@ -4175,6 +4673,7 @@ erlang_atom (s, pos)  }  #ifdef ETAGS_REGEXPS +  /* Take a string like "/blah/" and turn it into "blah", making sure     that the first and last characters are the same, and handling     quoted separator characters.  Actually, stops on the occurrence of @@ -4219,60 +4718,87 @@ scan_separators (name)  }  /* Look at the argument of --regex or --no-regex and do the right -   thing. */ +   thing.  Same for each line of a regexp file. */  void -analyse_regex (regex_arg) +analyse_regex (regex_arg, ignore_case)       char *regex_arg; +     bool ignore_case;  { -  struct stat stat_buf; -    if (regex_arg == NULL) +    free_patterns ();		/* --no-regex: remove existing regexps */ + +  /* A real --regexp option or a line in a regexp file. */ +  switch (regex_arg[0])      { -      /* Remove existing regexps. */ -      num_patterns = 0; -      patterns = NULL; -      return; -    } -  if (regex_arg[0] == '\0') -    { -      error ("missing regexp", (char *)NULL); -      return; -    } -  if (regex_arg[0] == '@' -      && stat (regex_arg + 1, &stat_buf) == 0) -    { -      FILE *regexfp; -      struct linebuffer regexbuf; -      char *regexfile = regex_arg + 1; +      /* Comments in regexp file or null arg to --regex. */ +    case '\0': +    case ' ': +    case '\t': +      break; -      /* regexfile is a file containing regexps, one per line. */ -      regexfp = fopen (regexfile, "r"); -      if (regexfp == NULL) -	{ -	  perror (regexfile); +      /* Read a regex file.  This is recursive and may result in a +	 loop, which will stop when the file descriptors are exhausted. */ +    case '@': +      { +	FILE *regexfp; +	linebuffer regexbuf; +	char *regexfile = regex_arg + 1; + +	/* regexfile is a file containing regexps, one per line. */ +	regexfp = fopen (regexfile, "r"); +	if (regexfp == NULL) +	  { +	    pfatal (regexfile); +	    return; +	  } +	initbuffer (®exbuf); +	while (readline_internal (®exbuf, regexfp) > 0) +	  analyse_regex (regexbuf.buffer, ignore_case); +	free (regexbuf.buffer); +	fclose (regexfp); +      } +      break; + +      /* Regexp to be used for a specific language only. */ +    case '{': +      { +	language *lang; +	char *lang_name = regex_arg + 1; +	char *cp; + +	for (cp = lang_name; *cp != '}'; cp++) +	  if (*cp == '\0') +	    { +	      error ("unterminated language name in regex: %s", regex_arg); +	      return; +	    } +	*cp = '\0'; +	lang = get_language_from_name (lang_name); +	if (lang == NULL)  	  return; -	} -      initbuffer (®exbuf); -      while (readline_internal (®exbuf, regexfp)) -	add_regex (regexbuf.buffer); -      free (regexbuf.buffer); -      fclose (regexfp); -    } -  else -    { -      add_regex (regex_arg); +	add_regex (cp + 1, ignore_case, lang); +      } +      break; + +      /* Regexp to be used for any language. */ +    default: +      add_regex (regex_arg, ignore_case, NULL); +      break;      }  }  /* Turn a name, which is an ed-style (but Emacs syntax) regular     expression, into a real regular expression by compiling it. */  void -add_regex (regexp_pattern) +add_regex (regexp_pattern, ignore_case, lang)       char *regexp_pattern; +     bool ignore_case; +     language *lang;  {    char *name;    const char *err;    struct re_pattern_buffer *patbuf; +  pattern *pp;    if (regexp_pattern[strlen(regexp_pattern)-1] != regexp_pattern[0]) @@ -4289,12 +4815,12 @@ add_regex (regexp_pattern)    (void) scan_separators (name);    patbuf = xnew (1, struct re_pattern_buffer); -  patbuf->translate = NULL; +  /* Translation table to fold case if appropriate. */ +  patbuf->translate = (ignore_case) ? lc_trans : NULL;    patbuf->fastmap = NULL;    patbuf->buffer = NULL;    patbuf->allocated = 0; -  re_syntax_options = RE_INTERVALS;    err = re_compile_pattern (regexp_pattern, strlen (regexp_pattern), patbuf);    if (err != NULL)      { @@ -4302,16 +4828,14 @@ add_regex (regexp_pattern)        return;      } -  num_patterns += 1; -  if (num_patterns == 1) -    patterns = xnew (1, struct pattern); -  else -    patterns = ((struct pattern *) -		xrealloc (patterns, -			  (num_patterns * sizeof (struct pattern)))); -  patterns[num_patterns - 1].pattern = patbuf; -  patterns[num_patterns - 1].name_pattern = savestr (name); -  patterns[num_patterns - 1].error_signaled = FALSE; +  pp = p_head; +  p_head = xnew (1, pattern); +  p_head->regex = savestr (regexp_pattern); +  p_head->p_next = pp; +  p_head->language = lang; +  p_head->pattern = patbuf; +  p_head->name_pattern = savestr (name); +  p_head->error_signaled = FALSE;  }  /* @@ -4360,49 +4884,88 @@ substitute (in, out, regs)        *t++ = *out;    *t = '\0'; -  if (DEBUG && (t > result + size || t - result != strlen (result))) +  if (DEBUG && (t > result + size || t - result != (int)strlen (result)))      abort ();    return result;  } + +/* Deallocate all patterns. */ +void +free_patterns () +{ +  pattern *pp; +  while (p_head != NULL) +    { +      pp = p_head->p_next; +      free (p_head->regex); +      free (p_head->name_pattern); +      free (p_head); +      p_head = pp; +    } +  return; +} +void +get_tag (bp) +     register char *bp; +{ +  register char *cp; + +  if (*bp == '\0') +    return; +  /* Go till you get to white space or a syntactic break */ +  for (cp = bp + 1; +       *cp != '\0' && *cp != '(' && *cp != ')' && !isspace (*cp); +       cp++) +    continue; +  pfnote (savenstr (bp, cp-bp), TRUE, +	  lb.buffer, cp - lb.buffer + 1, lineno, linecharno); +} +  #endif /* ETAGS_REGEXPS */  /* Initialize a linebuffer for use */  void -initbuffer (linebuffer) -     struct linebuffer *linebuffer; +initbuffer (lbp) +     linebuffer *lbp;  { -  linebuffer->size = 200; -  linebuffer->buffer = xnew (200, char); +  lbp->size = 200; +  lbp->buffer = xnew (200, char);  }  /* - * Read a line of text from `stream' into `linebuffer'. - * Return the number of characters read from `stream', - * which is the length of the line including the newline, if any. + * Read a line of text from `stream' into `lbp', excluding the + * newline or CR-NL, if any.  Return the number of characters read from + * `stream', which is the length of the line including the newline. + * + * On DOS or Windows we do not count the CR character, if any, before the + * NL, in the returned length; this mirrors the behavior of emacs on those + * platforms (for text files, it translates CR-NL to NL as it reads in the + * file).   */  long -readline_internal (linebuffer, stream) -     struct linebuffer *linebuffer; +readline_internal (lbp, stream) +     linebuffer *lbp;       register FILE *stream;  { -  char *buffer = linebuffer->buffer; -  register char *p = linebuffer->buffer; +  char *buffer = lbp->buffer; +  register char *p = lbp->buffer;    register char *pend;    int chars_deleted; -  pend = p + linebuffer->size;	/* Separate to avoid 386/IX compiler bug.  */ +  pend = p + lbp->size;		/* Separate to avoid 386/IX compiler bug.  */    while (1)      {        register int c = getc (stream);        if (p == pend)  	{ -	  linebuffer->size *= 2; -	  buffer = (char *) xrealloc (buffer, linebuffer->size); -	  p += buffer - linebuffer->buffer; -	  pend = buffer + linebuffer->size; -	  linebuffer->buffer = buffer; +	  /* We're at the end of linebuffer: expand it. */ +	  lbp->size *= 2; +	  buffer = xrnew (buffer, lbp->size, char); +	  p += buffer - lbp->buffer; +	  pend = buffer + lbp->size; +	  lbp->buffer = buffer;  	}        if (c == EOF)  	{ @@ -4435,39 +4998,43 @@ readline_internal (linebuffer, stream)  	}        *p++ = c;      } -  linebuffer->len = p - buffer; +  lbp->len = p - buffer; -  return linebuffer->len + chars_deleted; +  return lbp->len + chars_deleted;  }  /*   * Like readline_internal, above, but in addition try to match the - * input line against any existing regular expressions. + * input line against relevant regular expressions.   */  long -readline (linebuffer, stream) -     struct linebuffer *linebuffer; +readline (lbp, stream) +     linebuffer *lbp;       FILE *stream;  {    /* Read new line. */ -  long result = readline_internal (linebuffer, stream); +  long result = readline_internal (lbp, stream);  #ifdef ETAGS_REGEXPS -  int i; +  int match; +  pattern *pp; -  /* Match against all listed patterns. */ -  if (linebuffer->len > 0) -    for (i = 0; i < num_patterns; ++i) +  /* Match against relevant patterns. */ +  if (lbp->len > 0) +    for (pp = p_head; pp != NULL; pp = pp->p_next)        { -	int match = re_match (patterns[i].pattern, linebuffer->buffer, -			      linebuffer->len, 0, &patterns[i].regs); +	/* Only use generic regexps or those for the current language. */ +	if (pp->language != NULL && pp->language != curlang) +	  continue; + +	match = re_match (pp->pattern, lbp->buffer, lbp->len, 0, &pp->regs);  	switch (match)  	  {  	  case -2:  	    /* Some error. */ -	    if (!patterns[i].error_signaled) +	    if (!pp->error_signaled)  	      { -		error ("error while matching pattern %d", i); -		patterns[i].error_signaled = TRUE; +		error ("error while matching \"%s\"", pp->regex); +		pp->error_signaled = TRUE;  	      }  	    break;  	  case -1: @@ -4475,49 +5042,27 @@ readline (linebuffer, stream)  	    break;  	  default:  	    /* Match occurred.  Construct a tag. */ -	    if (patterns[i].name_pattern[0] != '\0') +	    if (pp->name_pattern[0] != '\0')  	      {  		/* Make a named tag. */ -		char *name = substitute (linebuffer->buffer, -					 patterns[i].name_pattern, -					 &patterns[i].regs); +		char *name = substitute (lbp->buffer, +					 pp->name_pattern, &pp->regs);  		if (name != NULL) -		  pfnote (name, TRUE, -			  linebuffer->buffer, match, lineno, linecharno); +		  pfnote (name, TRUE, lbp->buffer, match, lineno, linecharno);  	      }  	    else  	      {  		/* Make an unnamed tag. */  		pfnote ((char *)NULL, TRUE, -			linebuffer->buffer, match, lineno, linecharno); +			lbp->buffer, match, lineno, linecharno);  	      }  	    break;  	  }        }  #endif /* ETAGS_REGEXPS */ -   -  return result; -} -/* - * Read a file, but do no processing.  This is used to do regexp - * matching on files that have no language defined. - */ -void -just_read_file (inf) -     FILE *inf; -{ -  lineno = 0; -  charno = 0; - -  while (!feof (inf)) -    { -      ++lineno; -      linecharno = charno; -      charno += readline (&lb, inf); -    } +  return result;  } -  /*   * Return a pointer to a space of size strlen(cp)+1 allocated @@ -4587,6 +5132,26 @@ etags_strchr (sp, c)    return NULL;  } +/* Skip spaces, return new pointer. */ +char * +skip_spaces (cp) +     char *cp; +{ +  while (isspace (*cp))		/* isspace('\0')==FALSE */ +    cp++; +  return cp; +} + +/* Skip non spaces, return new pointer. */ +char * +skip_non_spaces (cp) +     char *cp; +{ +  while (!iswhite (*cp))	/* iswhite('\0')==TRUE */ +    cp++; +  return cp; +} +  /* Print error message and exit.  */  void  fatal (s1, s2) @@ -4607,8 +5172,14 @@ pfatal (s1)  void  suggest_asking_for_help ()  { -  fprintf (stderr, "\tTry `%s --help' for a complete list of options.\n", -	   progname); +  fprintf (stderr, "\tTry `%s %s' for a complete list of options.\n", +	   progname, +#ifdef LONG_OPTIONS +	   "--help" +#else +	   "-h" +#endif +	   );    exit (BAD);  } @@ -4644,7 +5215,7 @@ concat (s1, s2, s3)  char *  etags_getcwd ()  { -#if defined (HAVE_GETCWD) || defined (WINDOWSNT) +#ifdef HAVE_GETCWD    int bufsize = 200;    char *path = xnew (bufsize, char); @@ -4657,19 +5228,7 @@ etags_getcwd ()        path = xnew (bufsize, char);      } -#if WINDOWSNT -  { -    /* Convert backslashes to slashes.  */ -    char *p; -    for (p = path; *p != '\0'; p++) -      if (*p == '\\') -	*p = '/'; -    /* Canonicalize drive letter case.  */ -    if (islower (path[0])) -      path[0] = toupper (path[0]); -  } -#endif - +  canonicalize_filename (path);    return path;  #else /* not HAVE_GETCWD */ @@ -4686,7 +5245,7 @@ etags_getcwd ()    return strdup (path);  #else /* not MSDOS */ -  struct linebuffer path; +  linebuffer path;    FILE *pipe;    initbuffer (&path); @@ -4700,27 +5259,29 @@ etags_getcwd ()  #endif /* not HAVE_GETCWD */  } -/* Return a newly allocated string containing the file name -   of FILE relative to the absolute directory DIR (which -   should end with a slash). */ +/* Return a newly allocated string containing the file name of FILE +   relative to the absolute directory DIR (which should end with a slash). */  char *  relative_filename (file, dir)       char *file, *dir;  { -  char *fp, *dp, *abs, *res; +  char *fp, *dp, *afn, *res;    int i;    /* Find the common root of file and dir (with a trailing slash). */ -  abs = absolute_filename (file, cwd); -  fp = abs; +  afn = absolute_filename (file, cwd); +  fp = afn;    dp = dir;    while (*fp++ == *dp++)      continue;    fp--, dp--;			/* back to the first differing char */ -  do {				/* look at the equal chars until '/' */ -    if (fp == abs) return abs;	/* first char differs, give up */ +#ifdef DOS_NT +  if (fp == afn && afn[0] != '/') /* cannot build a relative name */ +    return afn; +#endif +  do				/* look at the equal chars until '/' */      fp--, dp--; -  } while (*fp != '/'); +  while (*fp != '/');    /* Build a sequence of "../" strings for the resulting relative file name. */    i = 0; @@ -4733,21 +5294,20 @@ relative_filename (file, dir)    /* Add the file name relative to the common root of file and dir. */    strcat (res, fp + 1); -  free (abs); +  free (afn);    return res;  } -/* Return a newly allocated string containing the -   absolute file name of FILE given CWD (which should -   end with a slash). */ +/* Return a newly allocated string containing the absolute file name +   of FILE given DIR (which should end with a slash). */  char * -absolute_filename (file, cwd) -     char *file, *cwd; +absolute_filename (file, dir) +     char *file, *dir;  {    char *slashp, *cp, *res; -  if (absolutefn (file)) +  if (filename_is_absolute (file))      res = savestr (file);  #ifdef DOS_NT    /* We don't support non-absolute file names with a drive @@ -4756,7 +5316,7 @@ absolute_filename (file, cwd)      fatal ("%s: relative file names with drive letters not supported", file);  #endif    else -    res = concat (cwd, file, ""); +    res = concat (dir, file, "");    /* Delete the "/dirname/.." and "/." substrings. */    slashp = etags_strchr (res, '/'); @@ -4770,7 +5330,7 @@ absolute_filename (file, cwd)  	      cp = slashp;  	      do  		cp--; -	      while (cp >= res && !absolutefn (cp)); +	      while (cp >= res && !filename_is_absolute (cp));  	      if (cp < res)  		cp = slashp;	/* the absolute name begins with "/.." */  #ifdef DOS_NT @@ -4794,12 +5354,6 @@ absolute_filename (file, cwd)        slashp = etags_strchr (slashp + 1, '/');      } -#ifdef DOS_NT -  /* Canonicalize drive letter case.  */ -  if (res[0] && islower (res[0])) -    res[0] = toupper (res[0]); -#endif -      if (res[0] == '\0')      return savestr ("/");    else @@ -4807,42 +5361,68 @@ absolute_filename (file, cwd)  }  /* Return a newly allocated string containing the absolute -   file name of dir where FILE resides given CWD (which should +   file name of dir where FILE resides given DIR (which should     end with a slash). */  char * -absolute_dirname (file, cwd) -     char *file, *cwd; +absolute_dirname (file, dir) +     char *file, *dir;  {    char *slashp, *res;    char save; -#ifdef DOS_NT -  char *p; - -  for (p = file; *p != '\0'; p++) -    if (*p == '\\') -      *p = '/'; -#endif +  canonicalize_filename (file);    slashp = etags_strrchr (file, '/');    if (slashp == NULL) -    return savestr (cwd); +    return savestr (dir);    save = slashp[1];    slashp[1] = '\0'; -  res = absolute_filename (file, cwd); +  res = absolute_filename (file, dir);    slashp[1] = save;    return res;  } +/* Whether the argument string is an absolute file name.  The argument +   string must have been canonicalized with canonicalize_filename. */ +bool +filename_is_absolute (fn) +     char *fn; +{ +  return (fn[0] == '/' +#ifdef DOS_NT +	  || (isalpha(fn[0]) && fn[1] == ':' && fn[2] == '/') +#endif +	  ); +} + +/* Translate backslashes into slashes.  Works in place. */ +void +canonicalize_filename (fn) +     register char *fn; +{ +#ifdef DOS_NT +  /* Convert backslashes to slashes.  */ +  for (; *fn != '\0'; fn++) +    if (*fn == '\\') +      *fn = '/'; +  /* Canonicalize drive letter case.  */ +  if (islower (path[0])) +    path[0] = toupper (path[0]); +#else +  /* No action. */ +  fn = NULL;			/* shut up the compiler */ +#endif +} +  /* Increase the size of a linebuffer. */  void -grow_linebuffer (bufp, toksize) -     struct linebuffer *bufp; +grow_linebuffer (lbp, toksize) +     linebuffer *lbp;       int toksize;  { -  while (bufp->size < toksize) -    bufp->size *= 2; -  bufp->buffer = (char *) xrealloc (bufp->buffer, bufp->size); +  while (lbp->size < toksize) +    lbp->size *= 2; +  lbp->buffer = xrnew (lbp->buffer, lbp->size, char);  }  /* Like malloc but get fatal error if memory is exhausted.  */ | 
