1 /* Protoize program - Original version by Ron Guilmette at MCC.
3 Copyright (C) 1989, 1992 Free Software Foundation, Inc.
5 This file is part of GNU CC.
7 GNU CC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
12 GNU CC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GNU CC; see the file COPYING. If not, write to
19 the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
21 /* Any reasonable C++ compiler should have all of the same features
22 as __STDC__ plus more, so make sure that __STDC__ is defined if
23 __cplusplus is defined. */
25 #if defined(__cplusplus) && !defined(__STDC__)
27 #endif /* defined(__cplusplus) && !defined(__STDC__) */
29 #if defined(__GNUC__) || defined (__GNUG__)
30 #define VOLATILE volatile
41 #ifdef POSIX /* We should be able to define _POSIX_SOURCE unconditionally,
42 but some systems respond in buggy ways to it,
43 including SunOS 4.1.1, which we don't classify as POSIX. */
44 /* In case this is a POSIX system with an ANSI C compiler,
45 ask for definition of all POSIX facilities. */
50 /* Users are not supposed to use _POSIX_SOURCE to say the
51 system is a POSIX system. That is not what _POSIX_SOURCE means! -- rms */
52 /* If the user asked for POSIX via _POSIX_SOURCE, turn on POSIX code. */
53 #if defined(_POSIX_SOURCE) && !defined(POSIX)
61 #include <sys/types.h>
64 #if ! defined (USG) || defined (SVR4)
71 #ifndef PATH_MAX /* <limits.h> defines this on most POSIX systems. */
72 #include <sys/param.h>
73 /* Sometimes <sys/param.h> defines these macros. */
93 extern char *sys_errlist[];
94 extern char *version_string;
96 /* Systems which are compatible only with POSIX 1003.1-1988 (but *not*
97 with POSIX 1003.1-1990), e.g. Ultrix 4.2, might not have
98 const qualifiers in the prototypes in the system include files.
99 Unfortunately, this can lead to GCC issuing lots of warnings for
100 calls to the following functions. To eliminate these warnings we
101 provide the following #defines. */
/* Thin wrappers around the file-related system calls.  Each one casts its
   pathname (or argv) argument to a non-`const' pointer type before making
   the call, so that callers may pass `const char *' values even when the
   system headers declare these functions without `const'.

   Every macro argument is parenthesized in the expansion, so an expression
   argument such as `dir + 1' is cast and passed as a whole instead of having
   the cast bind only to its first operand.  Each argument is evaluated
   exactly once.  */

/* Test accessibility FLAG (R_OK, W_OK, X_OK or F_OK) of FILE.  */
#define my_access(file,flag)	access ((char *) (file), (flag))
/* Fill in the stat buffer PKT for FILE.  */
#define my_stat(file,pkt)	stat ((char *) (file), (pkt))
/* Execute PROG with the argument vector ARGV.  */
#define my_execvp(prog,argv)	execvp ((char *) (prog), (char **) (argv))
/* Make FILE2 a new link to FILE1.  */
#define my_link(file1, file2)	link ((char *) (file1), (char *) (file2))
/* Remove the directory entry FILE.  */
#define my_unlink(file)		unlink ((char *) (file))
/* Open FILE with open-mode MODE and permission bits FLAG.  */
#define my_open(file, mode, flag)	open ((char *) (file), (mode), (flag))
/* Change the permission bits of FILE to MODE.  */
#define my_chmod(file, mode)	chmod ((char *) (file), (mode))
111 #if !(defined (USG) || defined (VMS) || defined (POSIX))
112 #define GUESSPATHLEN (MAXPATHLEN + 1)
113 #else /* (defined (USG) || defined (VMS) || defined (POSIX)) */
114 /* We actually use this as a starting point, not a limit. */
115 #define GUESSPATHLEN 200
116 #endif /* (defined (USG) || defined (VMS) || defined (POSIX)) */
118 /* Aliases for pointers to void.
119 These were made to facilitate compilation with other compilers. */
122 typedef void * pointer_type;
123 typedef const void * const_pointer_type;
125 typedef char * pointer_type;
126 typedef char * const_pointer_type;
137 #else /* !defined(POSIX) */
139 #define R_OK 4 /* Test for Read permission */
140 #define W_OK 2 /* Test for Write permission */
141 #define X_OK 1 /* Test for eXecute permission */
142 #define F_OK 0 /* Test for existence of File */
147 /* Virtually every UN*X system now in common use (except for pre-4.3-tahoe
148 BSD systems) now provides getcwd as called for by POSIX. Allow for
149 the few exceptions to the general rule here. */
151 #if !(defined (USG) || defined (VMS))
152 extern char *getwd ();
153 #define getcwd(buf,len) getwd(buf)
154 #else /* (defined (USG) || defined (VMS)) */
155 extern char *getcwd ();
156 #endif /* (defined (USG) || defined (VMS)) */
158 /* Declaring stat or __flsbuf with a prototype
159 causes conflicts with system headers on some systems. */
162 extern VOLATILE void abort ();
166 #if 0 /* These conflict with stdio.h on some systems. */
167 extern int fprintf (FILE *, const char *, ...);
168 extern int printf (const char *, ...);
171 extern pointer_type malloc ();
172 extern pointer_type realloc ();
177 extern int fflush ();
182 #if 0 /* Causes trouble on some systems that define setjmp as a macro. */
183 extern int setjmp ();
184 extern void longjmp ();
187 extern char * strcat ();
188 extern int strcmp ();
189 extern char * strcpy ();
190 #if 0 /* size_t from sys/types.h may fail to match GCC.
191 If so, we would get a warning from this.
192 So do without the prototype. */
193 extern size_t strlen (const char *);
195 extern int strncmp ();
196 extern char * strncpy ();
197 extern char * strrchr ();
199 /* Fork is not declared because the declaration caused a conflict
201 #if !(defined (USG) || defined (VMS))
203 #endif /* (defined (USG) || defined (VMS)) */
205 #endif /* !defined (POSIX) */
207 /* Look for these where the `const' qualifier is intentionally cast aside. */
211 /* Define a STRINGIFY macro that's right for ANSI or traditional C. */
214 #define STRINGIFY(STRING) #STRING
216 #define STRINGIFY(STRING) "STRING"
219 /* POSIX systems will not have definitions for WIFEXITED or WEXITSTATUS.
220 Define them correctly and so that they work for all environments. */
223 #define WIFEXITED(status_word) ((*((int *)&status_word) & 0xff) == 0x00)
226 #define WEXITSTATUS(status_word) ((*((int *)&status_word) & 0xff00) >> 8)
228 /* Define a default place to find the SYSCALLS.X file. */
230 #ifndef STD_PROTO_DIR
231 #define STD_PROTO_DIR "/usr/local/lib"
232 #endif /* !defined (STD_PROTO_DIR) */
234 /* Suffix of aux_info files. */
236 static const char * const aux_info_suffix = ".X";
238 /* String to attach to filenames for saved versions of original files. */
240 static const char * const save_suffix = ".save";
244 /* File name of the file which contains descriptions of standard system
245 routines. Note that we never actually do anything with this file per se,
246 but we do read in its corresponding aux_info file. */
248 static const char syscalls_filename[] = "SYSCALLS.c";
250 /* Default place to find the above file. */
252 static const char * const default_syscalls_dir = STD_PROTO_DIR;
254 /* Variable to hold the complete absolutized filename of the SYSCALLS.c.X
257 static char * syscalls_absolute_filename;
259 #endif /* !defined (UNPROTOIZE) */
261 /* Type of the structure that holds information about macro unexpansions. */
263 struct unexpansion_struct {
264 const char *expanded;
265 const char *contracted;
267 typedef struct unexpansion_struct unexpansion;
269 /* A table of conversions that may need to be made for some (stupid) older
270 operating systems where these types are preprocessor macros rather than
271 typedefs (as they really ought to be).
273 WARNING: The contracted forms must be as small as (or smaller than) the
274 expanded forms, or else havoc will ensue. */
276 static const unexpansion unexpansions[] = {
277 { "struct _iobuf", "FILE" },
281 /* The number of "primary" slots in the hash tables for filenames and for
282 function names. This can be as big or as small as you like, except that
283 it must be a power of two. */
285 #define HASH_TABLE_SIZE (1 << 9)
287 /* Bit mask to use when computing hash values. */
289 static const int hash_mask = (HASH_TABLE_SIZE - 1);
291 /* Make a table of default system include directories
292 just as it is done in cccp.c. */
294 #ifndef STANDARD_INCLUDE_DIR
295 #define STANDARD_INCLUDE_DIR "/usr/include"
298 #ifndef LOCAL_INCLUDE_DIR
299 #define LOCAL_INCLUDE_DIR "/usr/local/include"
302 struct default_include { char *fname; int cplusplus; } include_defaults[]
303 #ifdef INCLUDE_DEFAULTS
307 /* Pick up GNU C++ specific include files. */
308 { GPLUSPLUS_INCLUDE_DIR, 1},
309 { GCC_INCLUDE_DIR, 0},
311 /* For cross-compilation, this dir name is generated
312 automatically in Makefile.in. */
313 { CROSS_INCLUDE_DIR, 0 },
314 #else /* not CROSS_COMPILE */
315 { LOCAL_INCLUDE_DIR, 0},
316 /* Some systems have an extra dir of include files. */
317 #ifdef SYSTEM_INCLUDE_DIR
318 { SYSTEM_INCLUDE_DIR, 0},
320 { STANDARD_INCLUDE_DIR, 0},
321 #endif /* not CROSS_COMPILE */
324 #endif /* no INCLUDE_DEFAULTS */
326 /* Datatype for lists of directories or filenames. */
330 struct string_list *next;
333 /* List of directories in which files should be converted. */
335 struct string_list *directory_list;
337 /* List of file names which should not be converted.
338 A file is excluded if the end of its name, following a /,
339 matches one of the names in this list. */
341 struct string_list *exclude_list;
343 /* The name of the other style of variable-number-of-parameters functions
344 (i.e. the style that we want to leave unconverted because we don't yet
345 know how to convert them to this style. This string is used in warning
348 /* Also define here the string that we can search for in the parameter lists
349 taken from the .X files which will unambiguously indicate that we have
350 found a varargs style function. */
353 static const char * const other_var_style = "stdarg";
354 #else /* !defined (UNPROTOIZE) */
355 static const char * const other_var_style = "varargs";
356 /* Note that this is a string containing the expansion of va_alist.
357 But in `main' we discard all but the first token. */
358 static const char *varargs_style_indicator = STRINGIFY (va_alist);
359 #endif /* !defined (UNPROTOIZE) */
361 /* The following two types are used to create hash tables. In this program,
362 there are two hash tables which are used to store and quickly lookup two
363 different classes of strings. The first type of strings stored in the
364 first hash table are absolute filenames of files which protoize needs to
365 know about. The second type of strings (stored in the second hash table)
366 are function names. It is this second class of strings which really
367 inspired the use of the hash tables, because there may be a lot of them. */
369 typedef struct hash_table_entry_struct hash_table_entry;
371 /* Do some typedefs so that we don't have to write "struct" so often. */
373 typedef struct def_dec_info_struct def_dec_info;
374 typedef struct file_info_struct file_info;
375 typedef struct f_list_chain_item_struct f_list_chain_item;
377 /* In the struct below, note that the "_info" field has two different uses
378 depending on the type of hash table we are in (i.e. either the filenames
379 hash table or the function names hash table). In the filenames hash table
380 the info fields of the entries point to the file_info struct which is
381 associated with each filename (1 per filename). In the function names
382 hash table, the info field points to the head of a singly linked list of
383 def_dec_info entries which are all defs or decs of the function whose
384 name is pointed to by the "symbol" field. Keeping all of the defs/decs
385 for a given function name on a special list specifically for that function
386 name makes it quick and easy to find out all of the important information
387 about a given (named) function. */
389 struct hash_table_entry_struct {
390 hash_table_entry * hash_next; /* -> to secondary entries */
391 const char * symbol; /* -> to the hashed string */
393 const def_dec_info * _ddip;
397 #define ddip _info._ddip
398 #define fip _info._fip
400 /* Define a type specifically for our two hash tables. */
402 typedef hash_table_entry hash_table[HASH_TABLE_SIZE];
404 /* The following struct holds all of the important information about any
405 single filename (e.g. file) which we need to know about. */
407 struct file_info_struct {
408 const hash_table_entry * hash_entry; /* -> to associated hash entry */
409 const def_dec_info * defs_decs; /* -> to chain of defs/decs */
410 time_t mtime; /* Time of last modification. */
413 /* Due to the possibility that functions may return pointers to functions,
414 (which may themselves have their own parameter lists) and due to the
415 fact that returned pointers-to-functions may be of type "pointer-to-
416 function-returning-pointer-to-function" (ad nauseam) we have to keep
417 an entire chain of ANSI style formal parameter lists for each function.
419 Normally, for any given function, there will only be one formals list
420 on the chain, but you never know.
422 Note that the head of each chain of formals lists is pointed to by the
423 `f_list_chain' field of the corresponding def_dec_info record.
425 For any given chain, the item at the head of the chain is the *leftmost*
426 parameter list seen in the actual C language function declaration. If
427 there are other members of the chain, then these are linked in left-to-right
428 order from the head of the chain. */
430 struct f_list_chain_item_struct {
431 const f_list_chain_item * chain_next; /* -> to next item on chain */
432 const char * formals_list; /* -> to formals list string */
435 /* The following struct holds all of the important information about any
436 single function definition or declaration which we need to know about.
437 Note that for unprotoize we don't need to know very much because we
438 never even create records for stuff that we don't intend to convert
439 (like for instance defs and decs which are already in old K&R format
440 and "implicit" function declarations). */
442 struct def_dec_info_struct {
443 const def_dec_info * next_in_file; /* -> to rest of chain for file */
444 file_info * file; /* -> file_info for containing file */
445 int line; /* source line number of def/dec */
446 const char * ansi_decl; /* -> left end of ansi decl */
447 hash_table_entry * hash_entry; /* -> hash entry for function name */
448 unsigned int is_func_def; /* = 0 means this is a declaration */
449 const def_dec_info * next_for_func; /* -> to rest of chain for func name */
450 unsigned int f_list_count; /* count of formals lists we expect */
451 char prototyped; /* = 0 means already prototyped */
453 const f_list_chain_item * f_list_chain; /* -> chain of formals lists */
454 const def_dec_info * definition; /* -> def/dec containing related def */
455 char is_static; /* = 0 means visibility is "extern" */
456 char is_implicit; /* != 0 for implicit func decl's */
457 char written; /* != 0 means written for implicit */
458 #else /* !defined (UNPROTOIZE) */
459 const char * formal_names; /* -> to list of names of formals */
460 const char * formal_decls; /* -> to string of formal declarations */
461 #endif /* !defined (UNPROTOIZE) */
464 /* Pointer to the tail component of the filename by which this program was
465 invoked. Used everywhere in error and warning messages. */
467 static const char *pname;
469 /* Error counter. Will be non-zero if we should give up at the next convenient
472 static int errors = 0;
475 /* ??? These comments should say what the flags mean as well as the options
478 /* File name to use for running gcc. Allows GCC 2 to be named
479 something other than gcc. */
480 static char *compiler_file_name = "gcc";
482 static int version_flag = 0; /* Print our version number. */
483 static int quiet_flag = 0; /* Don't print messages normally. */
484 static int nochange_flag = 0; /* Don't convert, just say what files
485 we would have converted. */
486 static int nosave_flag = 0; /* Don't save the old version. */
487 static int keep_flag = 0; /* Don't delete the .X files. */
488 static const char ** compile_params = 0; /* Option string for gcc. */
490 static const char *indent_string = " "; /* Indentation for newly
491 inserted parm decls. */
492 #else /* !defined (UNPROTOIZE) */
493 static int local_flag = 0; /* Insert new local decls (when?). */
494 static int global_flag = 0; /* set by -g option */
495 static int cplusplus_flag = 0; /* Rename converted files to *.C. */
496 static const char* nondefault_syscalls_dir = 0; /* Dir to look for
498 #endif /* !defined (UNPROTOIZE) */
500 /* An index into the compile_params array where we should insert the filename
501 parameter when we are ready to exec the C compiler. A zero value indicates
502 that we have not yet called munge_compile_params. */
504 static int filename_index = 0;
506 /* Count of command line arguments which were "filename" arguments. */
508 static int n_base_source_files = 0;
510 /* Points to a malloc'ed list of pointers to all of the filenames of base
511 source files which were specified on the command line. */
513 static const char **base_source_filenames;
515 /* Line number of the line within the current aux_info file that we
516 are currently processing. Used for error messages in case the prototypes
517 info file is corrupted somehow. */
519 static int current_aux_info_lineno;
521 /* Pointer to the name of the source file currently being converted. */
523 static const char *convert_filename;
525 /* Pointer to relative root string (taken from aux_info file) which indicates
526 which directory the user was in when he did the compilation step that
527 produced the containing aux_info file. */
529 static const char *invocation_filename;
531 /* Pointer to the base of the input buffer that holds the original text for the
532 source file currently being converted. */
534 static const char *orig_text_base;
536 /* Pointer to the byte just beyond the end of the input buffer that holds the
537 original text for the source file currently being converted. */
539 static const char *orig_text_limit;
541 /* Pointer to the base of the input buffer that holds the cleaned text for the
542 source file currently being converted. */
544 static const char *clean_text_base;
546 /* Pointer to the byte just beyond the end of the input buffer that holds the
547 cleaned text for the source file currently being converted. */
549 static const char *clean_text_limit;
551 /* Pointer to the last byte in the cleaned text buffer that we have already
552 (virtually) copied to the output buffer (or decided to ignore). */
554 static const char * clean_read_ptr;
556 /* Pointer to the base of the output buffer that holds the replacement text
557 for the source file currently being converted. */
559 static char *repl_text_base;
561 /* Pointer to the byte just beyond the end of the output buffer that holds the
562 replacement text for the source file currently being converted. */
564 static char *repl_text_limit;
566 /* Pointer to the last byte which has been stored into the output buffer.
567 The next byte to be stored should be stored just past where this points
570 static char * repl_write_ptr;
572 /* Pointer into the cleaned text buffer for the source file we are currently
573 converting. This points to the first character of the line that we last
574 did a "seek_to_line" to (see below). */
576 static const char *last_known_line_start;
578 /* Number of the line (in the cleaned text buffer) that we last did a
579 "seek_to_line" to. Will be one if we just read a new source file
580 into the cleaned text buffer. */
582 static int last_known_line_number;
584 /* The filenames hash table. */
586 static hash_table filename_primary;
588 /* The function names hash table. */
590 static hash_table function_name_primary;
592 /* The place to keep the recovery address which is used only in cases where
593 we get hopelessly confused by something in the cleaned original text. */
595 static jmp_buf source_confusion_recovery;
597 /* A pointer to the current directory filename (used by abspath). */
599 static char *cwd_buffer;
601 /* A place to save the read pointer until we are sure that an individual
602 attempt at editing will succeed. */
604 static const char * saved_clean_read_ptr;
606 /* A place to save the write pointer until we are sure that an individual
607 attempt at editing will succeed. */
609 static char * saved_repl_write_ptr;
611 /* Forward declaration. */
613 static const char *shortpath ();
615 /* Allocate some space, but check that the allocation was successful. */
616 /* alloca.c uses this, so don't make it static. */
624 rv = malloc (byte_count);
627 fprintf (stderr, "\n%s: fatal error: can't allocate %u more bytes of memory\n",
630 return 0; /* avoid warnings */
636 /* Reallocate some space, but check that the reallocation was successful. */
639 xrealloc (old_space, byte_count)
640 pointer_type old_space;
645 rv = realloc (old_space, byte_count);
648 fprintf (stderr, "\n%s: fatal error: can't allocate %u more bytes of memory\n",
651 return 0; /* avoid warnings */
657 /* Deallocate the area pointed to by an arbitrary pointer, but first, strip
658 the `const' qualifier from it and also make sure that the pointer value
663 const_pointer_type p;
666 free ((NONCONST pointer_type) p);
669 /* Make a copy of a string INPUT with size SIZE. */
672 savestring (input, size)
676 char *output = (char *) xmalloc (size + 1);
677 strcpy (output, input);
681 /* More 'friendly' abort that prints the line and file.
682 config.h can #define abort fancy_abort if you like that sort of thing. */
687 fprintf (stderr, "%s: internal abort\n", pname);
691 /* Make a duplicate of a given string in a newly allocated area. */
697 return strcpy ((char *) xmalloc (strlen (s) + 1), s);
700 /* Make a duplicate of the first N bytes of a given string in a newly
708 char *ret_val = strncpy ((char *) xmalloc (n + 1), s, n);
714 /* Return a pointer to the first occurrence of s2 within s1 or NULL if s2
715 does not occur within s1. Assume neither s1 nor s2 are null pointers. */
720 const char *const s2;
728 for (p1 = s1, p2 = s2; c = *p2; p1++, p2++)
738 /* Get set up to recover in case the edit we are about to do goes awry. */
743 saved_clean_read_ptr = clean_read_ptr;
744 saved_repl_write_ptr = repl_write_ptr;
747 /* Call this routine to recover our previous state whenever something looks
748 too confusing in the source code we are trying to edit. */
753 clean_read_ptr = saved_clean_read_ptr;
754 repl_write_ptr = saved_repl_write_ptr;
757 /* Return true if the given character is a legal identifier character. */
763 return (isalnum (ch) || (ch == '_') || (ch == '$'));
766 /* Give a message indicating the proper way to invoke this program and then
767 exit with non-zero status. */
773 fprintf (stderr, "%s: usage '%s [ -VqfnkN ] [ -i <istring> ] [ filename ... ]'\n",
775 #else /* !defined (UNPROTOIZE) */
776 fprintf (stderr, "%s: usage '%s [ -VqfnkNlgC ] [ -B <diname> ] [ filename ... ]'\n",
778 #endif /* !defined (UNPROTOIZE) */
782 /* Return true if the given filename (assumed to be an absolute filename)
783 designates a file residing anywhere beneath any one of the "system"
784 include directories. */
787 in_system_include_dir (path)
790 struct default_include *p;
793 abort (); /* Must be an absolutized filename. */
795 for (p = include_defaults; p->fname; p++)
796 if (!strncmp (path, p->fname, strlen (p->fname))
797 && path[strlen (p->fname)] == '/')
803 /* Return true if the given filename designates a file that the user has
804 read access to and for which the user has write access to the containing
808 file_could_be_converted (const char *path)
810 char *const dir_name = (char *) alloca (strlen (path) + 1);
812 if (my_access (path, R_OK))
816 char *dir_last_slash;
818 strcpy (dir_name, path);
819 dir_last_slash = strrchr (dir_name, '/');
821 *dir_last_slash = '\0';
823 abort (); /* Should have been an absolutized filename. */
826 if (my_access (path, W_OK))
832 /* Return true if the given filename designates a file that we are allowed
833 to modify. Files which we should not attempt to modify are (a) "system"
834 include files, and (b) files which the user doesn't have write access to,
835 and (c) files which reside in directories which the user doesn't have
836 write access to. Unless requested to be quiet, give warnings about
837 files that we will not try to convert for one reason or another. An
838 exception is made for "system" include files, which we never try to
839 convert and for which we don't issue the usual warnings. */
842 file_normally_convertable (const char *path)
844 char *const dir_name = alloca (strlen (path) + 1);
846 if (in_system_include_dir (path))
850 char *dir_last_slash;
852 strcpy (dir_name, path);
853 dir_last_slash = strrchr (dir_name, '/');
855 *dir_last_slash = '\0';
857 abort (); /* Should have been an absolutized filename. */
860 if (my_access (path, R_OK))
863 fprintf (stderr, "%s: warning: no read access for file `%s'\n",
864 pname, shortpath (NULL, path));
868 if (my_access (path, W_OK))
871 fprintf (stderr, "%s: warning: no write access for file `%s'\n",
872 pname, shortpath (NULL, path));
876 if (my_access (dir_name, W_OK))
879 fprintf (stderr, "%s: warning: no write access for dir containing `%s'\n",
880 pname, shortpath (NULL, path));
890 /* Return true if the given file_info struct refers to the special SYSCALLS.c.X
891 file. Return false otherwise. */
894 is_syscalls_file (fi_p)
895 const file_info *fi_p;
897 char const *f = fi_p->hash_entry->symbol;
898 size_t fl = strlen (f), sysl = sizeof (syscalls_filename) - 1;
899 return sysl <= fl && strcmp (f + fl - sysl, syscalls_filename) == 0;
902 #endif /* !defined (UNPROTOIZE) */
904 /* Check to see if this file will need to have anything done to it on this
905 run. If there is nothing in the given file which both needs conversion
906 and for which we have the necessary stuff to do the conversion, return
907 false. Otherwise, return true.
909 Note that (for protoize) it is only valid to call this function *after*
910 the connections between declarations and definitions have all been made
911 by connect_defs_and_decs. */
914 needs_to_be_converted (file_p)
915 const file_info *file_p;
917 const def_dec_info *ddp;
921 if (is_syscalls_file (file_p))
924 #endif /* !defined (UNPROTOIZE) */
926 for (ddp = file_p->defs_decs; ddp; ddp = ddp->next_in_file)
932 /* ... and if we are protoizing and this function is in old style ... */
934 /* ... and if this is a definition or is a decl with an associated def ... */
935 && (ddp->is_func_def || (!ddp->is_func_def && ddp->definition))
937 #else /* defined (UNPROTOIZE) */
939 /* ... and if we are unprotoizing and this function is in new style ... */
942 #endif /* defined (UNPROTOIZE) */
944 /* ... then the containing file needs converting. */
949 /* Return 1 if the file name NAME is in a directory
950 that should be converted. */
953 directory_specified_p (name)
956 struct string_list *p;
958 for (p = directory_list; p; p = p->next)
959 if (!strncmp (name, p->name, strlen (p->name))
960 && name[strlen (p->name)] == '/')
962 const char *q = name + strlen (p->name) + 1;
964 /* If there are more slashes, it's in a subdir, so
965 this match doesn't count. */
977 /* Return 1 if the file named NAME should be excluded from conversion. */
980 file_excluded_p (name)
983 struct string_list *p;
984 int len = strlen (name);
986 for (p = exclude_list; p; p = p->next)
987 if (!strcmp (name + len - strlen (p->name), p->name)
988 && name[len - strlen (p->name) - 1] == '/')
994 /* Construct a new element of a string_list.
995 STRING is the new element value, and REST holds the remaining elements. */
997 static struct string_list *
998 string_list_cons (string, rest)
1000 struct string_list *rest;
1002 struct string_list *temp
1003 = (struct string_list *) xmalloc (sizeof (struct string_list));
1006 temp->name = string;
1010 /* ??? The GNU convention for mentioning function args in its comments
1011 is to capitalize them. So change "hash_tab_p" to HASH_TAB_P below.
1012 Likewise for all the other functions. */
1014 /* Given a hash table, apply some function to each node in the table. The
1015 table to traverse is given as the "hash_tab_p" argument, and the
1016 function to be applied to each node in the table is given as "func"
1020 visit_each_hash_node (hash_tab_p, func)
1021 const hash_table_entry *hash_tab_p;
1024 const hash_table_entry *primary;
1026 for (primary = hash_tab_p; primary < &hash_tab_p[HASH_TABLE_SIZE]; primary++)
1027 if (primary->symbol)
1029 hash_table_entry *second;
1032 for (second = primary->hash_next; second; second = second->hash_next)
1037 /* Initialize all of the fields of a new hash table entry, pointed
1038 to by the "p" parameter. Note that the space to hold the entry
1039 is assumed to have already been allocated before this routine is
1042 static hash_table_entry *
1044 hash_table_entry *p;
1047 p->hash_next = NULL;
1048 p->symbol = dupstr (s);
1054 /* Look for a particular function name or filename in the particular
1055 hash table indicated by "hash_tab_p". If the name is not in the
1056 given hash table, add it. Either way, return a pointer to the
1057 hash table entry for the given name. */
1059 static hash_table_entry *
1060 lookup (hash_tab_p, search_symbol)
1061 hash_table_entry *hash_tab_p;
1062 const char *search_symbol;
1065 const char *search_symbol_char_p = search_symbol;
1066 hash_table_entry *p;
1068 while (*search_symbol_char_p)
1069 hash_value += *search_symbol_char_p++;
1070 hash_value &= hash_mask;
1071 p = &hash_tab_p[hash_value];
1073 return add_symbol (p, search_symbol);
1074 if (!strcmp (p->symbol, search_symbol))
1076 while (p->hash_next)
1079 if (!strcmp (p->symbol, search_symbol))
1082 p->hash_next = (hash_table_entry *) xmalloc (sizeof (hash_table_entry));
1084 return add_symbol (p, search_symbol);
1087 /* Throw a def/dec record on the junk heap.
1089 Also, since we are not using this record anymore, free up all of the
1090 stuff it pointed to. */
1096 xfree (p->ansi_decl);
1100 const f_list_chain_item * curr;
1101 const f_list_chain_item * next;
1103 for (curr = p->f_list_chain; curr; curr = next)
1105 next = curr->chain_next;
1109 #endif /* !defined (UNPROTOIZE) */
1114 /* Unexpand as many macro symbols as we can find.
1116 If the given line must be unexpanded, make a copy of it in the heap and
1117 return a pointer to the unexpanded copy. Otherwise return NULL. */
1120 unexpand_if_needed (aux_info_line)
1121 const char *aux_info_line;
1123 static char *line_buf = 0;
1124 static int line_buf_size = 0;
1125 const unexpansion* unexp_p;
1126 int got_unexpanded = 0;
1128 char *copy_p = line_buf;
1132 line_buf_size = 1024;
1133 line_buf = (char *) xmalloc (line_buf_size);
1138 /* Make a copy of the input string in line_buf, unexpanding as necessary. */
1140 for (s = aux_info_line; *s != '\n'; )
1142 for (unexp_p = unexpansions; unexp_p->expanded; unexp_p++)
1144 const char *in_p = unexp_p->expanded;
1145 size_t len = strlen (in_p);
1147 if (*s == *in_p && !strncmp (s, in_p, len) && !is_id_char (s[len]))
1149 int size = strlen (unexp_p->contracted);
1151 if (copy_p + size - line_buf >= line_buf_size)
1153 int offset = copy_p - line_buf;
1155 line_buf_size += size;
1156 line_buf = (char *) xrealloc (line_buf, line_buf_size);
1157 copy_p = line_buf + offset;
1159 strcpy (copy_p, unexp_p->contracted);
1162 /* Assume that there will not be another replacement required
1163 within the text just replaced. */
1166 goto continue_outer;
1169 if (copy_p - line_buf == line_buf_size)
1171 int offset = copy_p - line_buf;
1173 line_buf = (char *) xrealloc (line_buf, line_buf_size);
1174 copy_p = line_buf + offset;
1179 if (copy_p + 2 - line_buf >= line_buf_size)
1181 int offset = copy_p - line_buf;
1183 line_buf = (char *) xrealloc (line_buf, line_buf_size);
1184 copy_p = line_buf + offset;
1189 return (got_unexpanded ? dupstr (line_buf) : 0);
1192 /* Return the absolutized filename for the given relative
1193 filename. Note that if that filename is already absolute, it may
1194 still be returned in a modified form because this routine also
1195 eliminates redundant slashes and single dots and eliminates double
1196 dots to get a shortest possible filename from the given input
1197 filename. The absolutization of relative filenames is made by
1198 assuming that the given filename is to be taken as relative to
1199 the first argument (cwd) or to the current directory if cwd is
/* CWD is the directory that REL_FILENAME is taken relative to; when CWD
   is null, `cwd_buffer' is used instead.  The name is assembled and then
   shortened in place in an alloca'd scratch buffer, and the result is
   returned as a heap copy made by dupstr.  An attempt to back up above
   the root is reported on stderr as an invalid file name.  */
1203 abspath (cwd, rel_filename)
1205 const char *rel_filename;
1207 /* Setup the current working directory as needed. */
1208 const char *cwd2 = (cwd) ? cwd : cwd_buffer;
/* The scratch buffer holds both strings plus two extra bytes (a joining
   slash and the terminating null).  */
1209 char *const abs_buffer
1210 = (char *) alloca (strlen (cwd2) + strlen (rel_filename) + 2);
1211 char *endp = abs_buffer;
1214 /* Copy the filename (possibly preceded by the current working
1215 directory name) into the absolutization buffer. */
1220 if (rel_filename[0] != '/')
1223 while (*endp++ = *src_p++)
1225 *(endp-1) = '/'; /* overwrite null */
1227 src_p = rel_filename;
1228 while (*endp++ = *src_p++)
1232 /* Now make a copy of abs_buffer into abs_buffer, shortening the
1233 filename (by taking out slashes and dots) as we go. */
1235 outp = inp = abs_buffer;
1236 *outp++ = *inp++; /* copy first slash */
1239 *outp++ = *inp++; /* copy second slash */
1245 else if (inp[0] == '/' && outp[-1] == '/')
1250 else if (inp[0] == '.' && outp[-1] == '/')
1254 else if (inp[1] == '/')
/* A `..' component (followed by a slash or the end of the string): skip
   it in the input and scan OUTP back towards the previous slash.  */
1259 else if ((inp[1] == '.') && (inp[2] == 0 || inp[2] == '/'))
1261 inp += (inp[2] == '/') ? 3 : 2;
1263 while (outp >= abs_buffer && *outp != '/')
1265 if (outp < abs_buffer)
1267 /* Catch cases like /.. where we try to backup to a
1268 point above the absolute root of the logical file
1271 fprintf (stderr, "%s: invalid file name: %s\n",
1272 pname, rel_filename);
1282 /* On exit, make sure that there is a trailing null, and make sure that
1283 the last character of the returned string is *not* a slash. */
1286 if (outp[-1] == '/')
1289 /* Make a copy (in the heap) of the stuff left in the absolutization
1290 buffer and return a pointer to the copy. */
1292 return dupstr (abs_buffer);
1295 /* Given a filename (and possibly a directory name from which the filename
1296 is relative) return a string which is the shortest possible
1297 equivalent for the corresponding full (absolutized) filename. The
1298 shortest possible equivalent may be constructed by converting the
1299 absolutized filename to be a relative filename (i.e. relative to
1300 the actual current working directory). However if a relative filename
1301 is longer, then the full absolute filename is returned.
1305 Note that "simple-minded" conversion of any given type of filename (either
1306 relative or absolute) may not result in a valid equivalent filename if any
1307 subpart of the original filename is actually a symbolic link. */
/* CWD and FILENAME are handed to abspath to obtain the absolutized name,
   which is then compared character by character against `cwd_buffer'.
   The relative form is assembled in a buffer of strlen (FILENAME) bytes
   obtained from xmalloc; the bounds tests below compare the write pointer
   against that limit.  */
1310 shortpath (cwd, filename)
1312 const char *filename;
1316 char *cwd_p = cwd_buffer;
1318 int unmatched_slash_count = 0;
1319 size_t filename_len = strlen (filename);
1321 path_p = abspath (cwd, filename);
1322 rel_buf_p = rel_buffer = (char *) xmalloc (filename_len);
/* Skip over the leading part that the two names have in common.  */
1324 while (*cwd_p && (*cwd_p == *path_p))
1329 if (!*cwd_p && (!*path_p || *path_p == '/')) /* whole pwd matched */
1331 if (!*path_p) /* input *is* the current path! */
1342 while (*cwd_p != '/') /* backup to last slash */
1349 unmatched_slash_count++;
1352 if (*cwd_p++ == '/')
1353 unmatched_slash_count++;
/* One iteration per slash counted above; each first checks that three
   more bytes fit within FILENAME_LEN.  */
1354 while (unmatched_slash_count--)
1356 if (rel_buffer + filename_len <= rel_buf_p + 3)
1365 if (rel_buffer + filename_len <= rel_buf_p)
1368 while (*rel_buf_p++ = *path_p++);
/* If the character just before REL_BUF_P is a slash, overwrite it with
   the terminating null.  */
1371 if (*(rel_buf_p-1) == '/')
1372 *--rel_buf_p = '\0';
1377 /* Lookup the given filename in the hash table for filenames. If it is a
1378 new one, then the hash table info pointer will be null. In this case,
1379 we create a new file_info record to go with the filename, and we initialize
1380 that record with some reasonable values. */
/* FILENAME is looked up in the `filename_primary' hash table.  If the
   entry already has a file_info attached, that record is returned as is.
   Otherwise a new file_info is allocated, linked with the hash entry in
   both directions, given an empty defs_decs list, and given the mtime
   held in STAT_BUF.

   NOTE(review): DO_NOT_STAT presumably selects the (time_t) 0 assignment
   below in place of the my_stat call -- confirm against the full source.  */
1383 find_file (filename, do_not_stat)
1386 /* FILENAME was const, but that causes a warning on AIX when calling stat.
1387 That is probably a bug in AIX, but might as well avoid the warning. */
1389 hash_table_entry *hash_entry_p;
1391 hash_entry_p = lookup (filename_primary, filename);
1392 if (hash_entry_p->fip)
1393 return hash_entry_p->fip;
1396 struct stat stat_buf;
1397 file_info *file_p = (file_info *) xmalloc (sizeof (file_info));
1399 /* If we cannot get status on any given source file, give a warning
1400 and then just set its time of last modification to infinity. */
1403 stat_buf.st_mtime = (time_t) 0;
1406 if (my_stat (filename, &stat_buf) == -1)
1408 fprintf (stderr, "%s: error: can't get status of `%s': %s\n",
1409 pname, shortpath (NULL, filename), sys_errlist[errno]);
1410 stat_buf.st_mtime = (time_t) -1;
/* Tie the new record and its hash table entry to each other.  */
1414 hash_entry_p->fip = file_p;
1415 file_p->hash_entry = hash_entry_p;
1416 file_p->defs_decs = NULL;
1417 file_p->mtime = stat_buf.st_mtime;
1422 /* Generate a fatal error because some part of the aux_info file is
/* Takes no arguments.  Writes a "fatal error" message to stderr that names
   the program (`pname') and the aux info line currently being processed
   (`current_aux_info_lineno').  */
1426 aux_info_corrupted ()
1428 fprintf (stderr, "\n%s: fatal error: aux info file corrupted at line %d\n",
1429 pname, current_aux_info_lineno);
1433 /* ??? This comment is vague. Say what the condition is for. */
1434 /* Check to see that a condition is true. This is kind of like an assert. */
/* COND is the value of the condition being checked.  The failure path is a
   call to aux_info_corrupted (presumably taken only when COND is zero --
   confirm against the full source).  */
1437 check_aux_info (cond)
1441 aux_info_corrupted ();
1444 /* Given a pointer to the closing right parenthesis for a particular formals
1445 list (in an aux_info file) find the corresponding left parenthesis and
1446 return a pointer to it. */
/* P points at the closing right parenthesis.  The scan starts one character
   to the left of P with a nesting depth of 1 and moves leftwards for as
   long as the depth is nonzero.  */
1449 find_corresponding_lparen (p)
1455 for (paren_depth = 1, q = p-1; paren_depth; q--)
1470 /* Given a line from an aux info file, and a time at which the aux info
1471 file it came from was created, check to see if the item described in
1472 the line comes from a file which has been modified since the aux info
1473 file was created. If so, return non-zero, else return zero. */
/* L is one line of the aux_info file; it is checked (via check_aux_info)
   to start with a slash, a star and a space.  The filename that follows is
   copied into an alloca'd buffer, absolutized relative to
   `invocation_filename', and looked up with find_file.  AUX_INFO_MTIME is
   the modification time of the aux_info file; the result is nonzero when
   the referenced file's recorded mtime is greater than it.  */
1476 referenced_file_is_newer (l, aux_info_mtime)
1478 time_t aux_info_mtime;
1484 check_aux_info (l[0] == '/');
1485 check_aux_info (l[1] == '*');
1486 check_aux_info (l[2] == ' ');
1489 const char *filename_start = p = l + 3;
/* strncpy does not terminate the copy here, so the null is stored
   explicitly in the extra byte that was allocated.  */
1493 filename = (char *) alloca ((size_t) (p - filename_start) + 1);
1494 strncpy (filename, filename_start, (size_t) (p - filename_start));
1495 filename[p-filename_start] = '\0';
1498 /* Call find_file to find the file_info record associated with the file
1499 which contained this particular def or dec item. Note that this call
1500 may cause a new file_info record to be created if this is the first time
1501 that we have ever known about this particular file. */
1503 fi_p = find_file (abspath (invocation_filename, filename), 0);
1505 return (fi_p->mtime > aux_info_mtime);
1508 /* Given a line of info from the aux_info file, create a new
1509 def_dec_info record to remember all of the important information about
1510 a function definition or declaration.
1512 Link this record onto the list of such records for the particular file in
1513 which it occurred in proper (descending) line number order (for now).
1515 If there is an identical record already on the list for the file, throw
1516 this one away. Doing so takes care of the (useless and troublesome)
1517 duplicates which are bound to crop up due to multiple inclusions of any
1518 given individual header file.
1520 Finally, link the new def_dec record onto the list of such records
1521 pertaining to this particular function name. */
/* L is one line from the aux_info file.  IS_SYSCALLS is passed to find_file
   as its second argument and, when nonzero, also forces the record's
   is_func_def flag on.  The new def_dec_info record is allocated with
   xmalloc; when an existing record for the same function has the same
   line number and file, the new record is released with free_def_dec.  */
1524 save_def_or_dec (l, is_syscalls)
1529 const char *semicolon_p;
1530 def_dec_info *def_dec_p = (def_dec_info *) xmalloc (sizeof (def_dec_info));
1533 def_dec_p->written = 0;
1534 #endif /* !defined (UNPROTOIZE) */
1536 /* Start processing the line by picking off 5 pieces of information from
1537 the left hand end of the line. These are filename, line number,
1538 new/old/implicit flag (new = ANSI prototype format), definition or
1539 declaration flag, and extern/static flag). */
1541 check_aux_info (l[0] == '/');
1542 check_aux_info (l[1] == '*');
1543 check_aux_info (l[2] == ' ');
1546 const char *filename_start = p = l + 3;
1551 filename = (char *) alloca ((size_t) (p - filename_start) + 1);
1552 strncpy (filename, filename_start, (size_t) (p - filename_start));
1553 filename[p-filename_start] = '\0';
1555 /* Call find_file to find the file_info record associated with the file
1556 which contained this particular def or dec item. Note that this call
1557 may cause a new file_info record to be created if this is the first time
1558 that we have ever known about this particular file.
1560 Note that we started out by forcing all of the base source file names
1561 (i.e. the names of the aux_info files with the .X stripped off) into the
1562 filenames hash table, and we simultaneously setup file_info records for
1563 all of these base file names (even if they may be useless later).
1564 The file_info records for all of these "base" file names (properly)
1565 act as file_info records for the "original" (i.e. un-included) files
1566 which were submitted to gcc for compilation (when the -fgen-aux-info
1567 option was used). */
1569 def_dec_p->file = find_file (abspath (invocation_filename, filename), is_syscalls);
1573 const char *line_number_start = ++p;
/* NOTE(review): this buffer holds at most nine digits plus the null, while
   the copy below is sized by the input text -- confirm that the aux_info
   format bounds the length of the line number field.  */
1574 char line_number[10];
1578 strncpy (line_number, line_number_start, (size_t) (p - line_number_start));
1579 line_number[p-line_number_start] = '\0';
1580 def_dec_p->line = atoi (line_number);
1583 /* Check that this record describes a new-style, old-style, or implicit
1584 definition or declaration. */
1586 p++; /* Skip over the `:'. */
1587 check_aux_info ((*p == 'N') || (*p == 'O') || (*p == 'I'));
1589 /* Is this a new style (ANSI prototyped) definition or declaration? */
1591 def_dec_p->prototyped = (*p == 'N');
1595 /* Is this an implicit declaration? */
1597 def_dec_p->is_implicit = (*p == 'I');
1599 #endif /* !defined (UNPROTOIZE) */
1603 check_aux_info ((*p == 'C') || (*p == 'F'));
1605 /* Is this item a function definition (F) or a declaration (C). Note that
1606 we treat item taken from the syscalls file as though they were function
1607 definitions regardless of what the stuff in the file says. */
1609 def_dec_p->is_func_def = ((*p++ == 'F') || is_syscalls);
1612 def_dec_p->definition = 0; /* Fill this in later if protoizing. */
1613 #endif /* !defined (UNPROTOIZE) */
1615 check_aux_info (*p++ == ' ');
1616 check_aux_info (*p++ == '*');
1617 check_aux_info (*p++ == '/');
1618 check_aux_info (*p++ == ' ');
1621 check_aux_info ((!strncmp (p, "static", 6)) || (!strncmp (p, "extern", 6)));
1622 #else /* !defined (UNPROTOIZE) */
1623 if (!strncmp (p, "static", 6))
1624 def_dec_p->is_static = -1;
1625 else if (!strncmp (p, "extern", 6))
1626 def_dec_p->is_static = 0;
1628 check_aux_info (0); /* Didn't find either `extern' or `static'. */
1629 #endif /* !defined (UNPROTOIZE) */
1632 const char *ansi_start = p;
1634 p += 6; /* Pass over the "static" or "extern". */
1636 /* We are now past the initial stuff. Search forward from here to find
1637 the terminating semicolon that should immediately follow the entire
1638 ANSI format function declaration. */
1645 /* Make a copy of the ansi declaration part of the line from the aux_info
1648 def_dec_p->ansi_decl
1649 = dupnstr (ansi_start, (size_t) ((semicolon_p+1) - ansi_start));
1652 /* Backup and point at the final right paren of the final argument list. */
1656 /* Now isolate a whole set of formal argument lists, one-by-one. Normally,
1657 there will only be one list to isolate, but there could be more. */
1659 def_dec_p->f_list_count = 0;
1662 def_dec_p->f_list_chain = NULL;
1663 #endif /* !defined (UNPROTOIZE) */
1667 const char *left_paren_p = find_corresponding_lparen (p);
1670 f_list_chain_item *cip =
1671 (f_list_chain_item *) xmalloc (sizeof (f_list_chain_item));
1674 = dupnstr (left_paren_p + 1, (size_t) (p - (left_paren_p+1)));
1676 /* Add the new chain item at the head of the current list. */
1678 cip->chain_next = def_dec_p->f_list_chain;
1679 def_dec_p->f_list_chain = cip;
1681 #endif /* !defined (UNPROTOIZE) */
1682 def_dec_p->f_list_count++;
1684 p = left_paren_p - 2;
1686 /* p must now point either to another right paren, or to the last
1687 character of the name of the function that was declared/defined.
1688 If p points to another right paren, then this indicates that we
1689 are dealing with multiple formals lists. In that case, there
1690 really should be another right paren preceding this right paren. */
1695 check_aux_info (*--p == ')');
1700 const char *past_fn = p + 1;
1702 check_aux_info (*past_fn == ' ');
1704 /* Scan leftwards over the identifier that names the function. */
1706 while (is_id_char (*p))
1710 /* p now points to the leftmost character of the function name. */
1713 char *fn_string = (char *) alloca (past_fn - p + 1);
1715 strncpy (fn_string, p, (size_t) (past_fn - p));
1716 fn_string[past_fn-p] = '\0';
1717 def_dec_p->hash_entry = lookup (function_name_primary, fn_string);
1721 /* Look at all of the defs and decs for this function name that we have
1722 collected so far. If there is already one which is at the same
1723 line number in the same file, then we can discard this new def_dec_info
1726 As an extra assurance that any such pair of (nominally) identical
1727 function declarations are in fact identical, we also compare the
1728 ansi_decl parts of the lines from the aux_info files just to be on
1731 This comparison will fail if (for instance) the user was playing
1732 messy games with the preprocessor which ultimately causes one
1733 function declaration in one header file to look differently when
1734 that file is included by two (or more) other files. */
1737 const def_dec_info *other;
1739 for (other = def_dec_p->hash_entry->ddip; other; other = other->next_for_func)
1741 if (def_dec_p->line == other->line && def_dec_p->file == other->file)
1743 if (strcmp (def_dec_p->ansi_decl, other->ansi_decl))
1745 fprintf (stderr, "%s: error: declaration of function `%s' at %s(%d) takes different forms\n",
1747 def_dec_p->hash_entry->symbol,
1748 def_dec_p->file->hash_entry->symbol,
1752 free_def_dec (def_dec_p);
1760 /* If we are doing unprotoizing, we must now setup the pointers that will
1761 point to the K&R name list and to the K&R argument declarations list.
1763 Note that if this is only a function declaration, then we should not
1764 expect to find any K&R style formals list following the ANSI-style
1765 formals list. This is because GCC knows that such information is
1766 useless in the case of function declarations (function definitions
1767 are a different story however).
1769 Since we are unprotoizing, we don't need any such lists anyway.
1770 All we plan to do is to delete all characters between ()'s in any
1773 def_dec_p->formal_names = NULL;
1774 def_dec_p->formal_decls = NULL;
1776 if (def_dec_p->is_func_def)
1779 check_aux_info (*++p == ' ');
1780 check_aux_info (*++p == '/');
1781 check_aux_info (*++p == '*');
1782 check_aux_info (*++p == ' ');
1783 check_aux_info (*++p == '(');
1786 const char *kr_names_start = ++p; /* Point just inside '('. */
1790 p--; /* point to closing right paren */
1792 /* Make a copy of the K&R parameter names list. */
1794 def_dec_p->formal_names
1795 = dupnstr (kr_names_start, (size_t) (p - kr_names_start));
1798 check_aux_info (*++p == ' ');
1801 /* p now points to the first character of the K&R style declarations
1802 list (if there is one) or to the star-slash combination that ends
1803 the comment in which such lists get embedded. */
1805 /* Make a copy of the K&R formal decls list and set the def_dec record
1808 if (*p == '*') /* Are there no K&R declarations? */
1810 check_aux_info (*++p == '/');
1811 def_dec_p->formal_decls = "";
1815 const char *kr_decls_start = p;
1817 while (p[0] != '*' || p[1] != '/')
1821 check_aux_info (*p == ' ');
1823 def_dec_p->formal_decls
1824 = dupnstr (kr_decls_start, (size_t) (p - kr_decls_start));
1827 /* Handle a special case. If we have a function definition marked as
1828 being in "old" style, and if its formal names list is empty, then
1829 it may actually have the string "void" in its real formals list
1830 in the original source code. Just to make sure, we will get setup
1831 to convert such things anyway.
1833 This kludge only needs to be here because of an insurmountable
1834 problem with generating .X files. */
1836 if (!def_dec_p->prototyped && !*def_dec_p->formal_names)
1837 def_dec_p->prototyped = 1;
1840 /* Since we are unprotoizing, if this item is already in old (K&R) style,
1841 we can just ignore it. If that is true, throw away the item now. */
1843 if (!def_dec_p->prototyped)
1845 free_def_dec (def_dec_p);
1849 #endif /* defined (UNPROTOIZE) */
1851 /* Add this record to the head of the list of records pertaining to this
1852 particular function name. */
1854 def_dec_p->next_for_func = def_dec_p->hash_entry->ddip;
1855 def_dec_p->hash_entry->ddip = def_dec_p;
1857 /* Add this new def_dec_info record to the sorted list of def_dec_info
1858 records for this file. Note that we don't have to worry about duplicates
1859 (caused by multiple inclusions of header files) here because we have
1860 already eliminated duplicates above. */
1862 if (!def_dec_p->file->defs_decs)
1864 def_dec_p->file->defs_decs = def_dec_p;
1865 def_dec_p->next_in_file = NULL;
/* Walk the list while the new line number is smaller than the current
   entry's.  The new record is then linked in front of CURR (after PREV or
   as the list head), or failing that, appended after the last entry.  */
1869 int line = def_dec_p->line;
1870 const def_dec_info *prev = NULL;
1871 const def_dec_info *curr = def_dec_p->file->defs_decs;
1872 const def_dec_info *next = curr->next_in_file;
1874 while (next && (line < curr->line))
1878 next = next->next_in_file;
1880 if (line >= curr->line)
1882 def_dec_p->next_in_file = curr;
1884 ((NONCONST def_dec_info *) prev)->next_in_file = def_dec_p;
1886 def_dec_p->file->defs_decs = def_dec_p;
1888 else /* assert (next == NULL); */
1890 ((NONCONST def_dec_info *) curr)->next_in_file = def_dec_p;
1891 /* assert (next == NULL); */
1892 def_dec_p->next_in_file = next;
1897 /* Rewrite the options list used to recompile base source files. All we are
1898 really doing here is removing -g, -O, -S, -c, and -o options, and then
1899 adding a final group of options like '-fgen-aux-info -S -o /dev/null'. */
/* PARAMS_LIST is a string of whitespace-separated options.  Its words are
   collected into an alloca'd temporary vector that starts with
   `compiler_file_name'.  The fixed options -fgen-aux-info, -S, -o and
   /dev/null are appended, followed by a null slot for the filename (its
   index is saved in `filename_index') and a terminating null pointer.
   The vector is finally copied into heap storage as `compile_params'.  */
1902 munge_compile_params (params_list)
1903 const char *params_list;
1906 = (char **) alloca ((strlen (params_list) + 6) * sizeof (char *));
1907 int param_count = 0;
1910 temp_params[param_count++] = compiler_file_name;
1913 while (isspace (*params_list))
1917 param = params_list;
1918 while (*params_list && !isspace (*params_list))
/* A word that does not begin with '-' is copied through unchanged.  */
1920 if (param[0] != '-')
1921 temp_params[param_count++]
1922 = dupnstr (param, (size_t) (params_list - param));
1931 break; /* Don't copy these. */
1933 while (isspace (*params_list))
1935 while (*params_list && !isspace (*params_list))
1939 temp_params[param_count++]
1940 = dupnstr (param, (size_t) (params_list - param));
1946 temp_params[param_count++] = "-fgen-aux-info";
1947 temp_params[param_count++] = "-S";
1948 temp_params[param_count++] = "-o";
1949 temp_params[param_count++] = "/dev/null";
1951 /* Leave room for the filename argument and a terminating null pointer. */
1953 temp_params[filename_index = param_count++] = NULL;
1954 temp_params[param_count++] = NULL;
1956 /* Make a copy of the compile_params in heap space. */
1959 = (const char **) xmalloc (sizeof (char *) * (param_count+1));
1960 memcpy (compile_params, temp_params, sizeof (char *) * param_count);
1963 /* Do a recompilation for the express purpose of generating a new aux_info
1964 file to go with a specific base source file. */
/* BASE_FILENAME names the source file to recompile.  Its shortpath form is
   stored in compile_params[filename_index]; if `filename_index' is still
   zero, the parameter vector is first built with munge_compile_params ("").
   The process then forks.  The parent reports a failed fork, waits for the
   child, and reports a failed wait, an abnormal termination or a nonzero
   exit status on stderr.  The child runs the compiler through my_execvp.  */
1967 gen_aux_info_file (base_filename)
1968 const char *base_filename;
1972 if (!filename_index)
1973 munge_compile_params ("");
1975 compile_params[filename_index] = shortpath (NULL, base_filename);
1978 fprintf (stderr, "%s: compiling `%s'\n",
1979 pname, compile_params[filename_index]);
/* fork returns nonzero in the parent (the child's pid, or -1 on error).  */
1981 if (child_pid = fork ())
1983 if (child_pid == -1)
1985 fprintf (stderr, "%s: error: could not fork process: %s\n",
1986 pname, sys_errlist[errno]);
1991 /* Print out the command line that the other process is now executing. */
1997 fputs ("\t", stderr);
1998 for (arg = compile_params; *arg; arg++)
2000 fputs (*arg, stderr);
2001 fputc (' ', stderr);
2003 fputc ('\n', stderr);
2011 if (wait (&wait_status) == -1)
2013 fprintf (stderr, "%s: error: wait for process failed: %s\n",
2014 pname, sys_errlist[errno]);
2017 if (!WIFEXITED (wait_status))
2019 fprintf (stderr, "%s: error: subprocess %ld did not exit\n",
2020 pname, (long) child_pid);
2021 kill (child_pid, 9);
2024 if (WEXITSTATUS (wait_status) != 0)
2026 fprintf (stderr, "%s: error: %s: compilation failed\n",
2027 pname, base_filename);
/* Child side: a nonzero return from my_execvp is reported with raw write
   calls on stderr's descriptor.  errno is saved in E first so that the
   writes cannot disturb it.  */
2035 if (my_execvp (compile_params[0], (char *const *) compile_params))
2037 int e = errno, f = fileno (stderr);
2038 write (f, pname, strlen (pname));
2040 write (f, compile_params[0], strlen (compile_params[0]));
2042 write (f, sys_errlist[e], strlen (sys_errlist[e]));
2046 return 1; /* Never executed. */
2050 /* Read in all of the information contained in a single aux_info file.
2051 Save all of the important stuff for later. */
/* BASE_SOURCE_FILENAME is the source file whose aux_info file is wanted;
   the aux_info filename is that name with `aux_info_suffix' appended.
   IS_SYSCALLS is forwarded to save_def_or_dec for every line.  KEEP_IT is
   consulted when a stale aux_info file has to be removed again.
   NOTE(review): KEEP_IT presumably also guards the deletion that follows
   the read -- confirm against the full source.

   The whole file is read into an xmalloc'd buffer of st_size + 1 bytes
   with a null stored at the end.  That buffer, and any relocated
   invocation directory name, are released before returning.  */
2054 process_aux_info_file (base_source_filename, keep_it, is_syscalls)
2055 const char *base_source_filename;
2059 size_t base_len = strlen (base_source_filename);
2060 char * aux_info_filename
2061 = (char *) alloca (base_len + strlen (aux_info_suffix) + 1);
2062 char *aux_info_base;
2063 char *aux_info_limit;
2064 char *aux_info_relocated_name;
2065 const char *aux_info_second_line;
2066 time_t aux_info_mtime;
2067 size_t aux_info_size;
2069 /* Construct the aux_info filename from the base source filename. */
2071 strcpy (aux_info_filename, base_source_filename);
2072 strcat (aux_info_filename, aux_info_suffix);
2074 /* Check that the aux_info file exists and is readable. If it does not
2075 exist, try to create it (once only). */
2083 if (my_access (aux_info_filename, R_OK) == -1)
2085 if (errno == ENOENT && retries == 0)
2089 fprintf (stderr, "%s: warning: missing SYSCALLS file `%s'\n",
2090 pname, aux_info_filename);
2093 if (!gen_aux_info_file (base_source_filename))
2103 fprintf (stderr, "%s: error: can't read aux info file `%s': %s\n",
2104 pname, shortpath (NULL, aux_info_filename),
2105 sys_errlist[errno]);
2113 struct stat stat_buf;
2115 /* Get some status information about this aux_info file. */
2117 if (my_stat (aux_info_filename, &stat_buf) == -1)
2119 fprintf (stderr, "%s: error: can't get status of aux info file `%s': %s\n",
2120 pname, shortpath (NULL, aux_info_filename),
2121 sys_errlist[errno]);
2126 /* Check on whether or not this aux_info file is zero length. If it is,
2127 then just ignore it and return. */
2129 if ((aux_info_size = stat_buf.st_size) == 0)
2132 /* Get the date/time of last modification for this aux_info file and
2133 remember it. We will have to check that any source files that it
2134 contains information about are at least this old or older. */
2136 aux_info_mtime = stat_buf.st_mtime;
2142 /* Open the aux_info file. */
2144 if ((aux_info_file = my_open (aux_info_filename, O_RDONLY, 0444 )) == -1)
2146 fprintf (stderr, "%s: error: can't open aux info file `%s' for reading: %s\n",
2147 pname, shortpath (NULL, aux_info_filename),
2148 sys_errlist[errno]);
2152 /* Allocate space to hold the aux_info file in memory. */
2154 aux_info_base = xmalloc (aux_info_size + 1);
2155 aux_info_limit = aux_info_base + aux_info_size;
2156 *aux_info_limit = '\0';
2158 /* Read the aux_info file into memory. */
2160 if (read (aux_info_file, aux_info_base, aux_info_size) != aux_info_size)
2162 fprintf (stderr, "%s: error: while reading aux info file `%s': %s\n",
2163 pname, shortpath (NULL, aux_info_filename),
2164 sys_errlist[errno]);
2165 free (aux_info_base);
2166 close (aux_info_file);
2170 /* Close the aux info file. */
2172 if (close (aux_info_file))
2174 fprintf (stderr, "%s: error: while closing aux info file `%s': %s\n",
2175 pname, shortpath (NULL, aux_info_filename),
2176 sys_errlist[errno]);
2177 free (aux_info_base);
/* NOTE(review): close (aux_info_file) was already attempted in the
   condition above; this second close of the same descriptor looks
   redundant -- confirm.  */
2178 close (aux_info_file);
2183 /* Delete the aux_info file (unless requested not to). If the deletion
2184 fails for some reason, don't even worry about it. */
2187 if (my_unlink (aux_info_filename) == -1)
2188 fprintf (stderr, "%s: error: can't delete aux info file `%s': %s\n",
2189 pname, shortpath (NULL, aux_info_filename),
2190 sys_errlist[errno]);
2192 /* Save a pointer into the first line of the aux_info file which
2193 contains the filename of the directory from which the compiler
2194 was invoked when the associated source file was compiled.
2195 This information is used later to help create complete
2196 filenames out of the (potentially) relative filenames in
2197 the aux_info file. */
2200 char *p = aux_info_base;
2207 invocation_filename = p; /* Save a pointer to first byte of path. */
2212 while (*p++ != '\n')
2214 aux_info_second_line = p;
2215 aux_info_relocated_name = 0;
2216 if (invocation_filename[0] != '/')
2218 /* INVOCATION_FILENAME is relative;
2219 append it to BASE_SOURCE_FILENAME's dir. */
2221 aux_info_relocated_name = xmalloc (base_len + (p-invocation_filename));
2222 strcpy (aux_info_relocated_name, base_source_filename);
2223 dir_end = strrchr (aux_info_relocated_name, '/');
2227 dir_end = aux_info_relocated_name;
2228 strcpy (dir_end, invocation_filename);
2229 invocation_filename = aux_info_relocated_name;
2235 const char *aux_info_p;
2237 /* Do a pre-pass on the lines in the aux_info file, making sure that all
2238 of the source files referenced in there are at least as old as this
2239 aux_info file itself. If not, go back and regenerate the aux_info
2240 file anew. Don't do any of this for the syscalls file. */
2244 current_aux_info_lineno = 2;
2246 for (aux_info_p = aux_info_second_line; *aux_info_p; )
2248 if (referenced_file_is_newer (aux_info_p, aux_info_mtime))
2250 free (aux_info_base);
2251 xfree (aux_info_relocated_name);
2252 if (keep_it && my_unlink (aux_info_filename) == -1)
2254 fprintf (stderr, "%s: error: can't delete file `%s': %s\n",
2255 pname, shortpath (NULL, aux_info_filename),
2256 sys_errlist[errno]);
2262 /* Skip over the rest of this line to start of next line. */
2264 while (*aux_info_p != '\n')
2267 current_aux_info_lineno++;
2271 /* Now do the real pass on the aux_info lines. Save their information in
2272 the in-core data base. */
2274 current_aux_info_lineno = 2;
2276 for (aux_info_p = aux_info_second_line; *aux_info_p;)
2278 char *unexpanded_line = unexpand_if_needed (aux_info_p);
/* A non-null result is a heap copy of the rewritten line; it is used in
   place of the original text and then freed.  */
2280 if (unexpanded_line)
2282 save_def_or_dec (unexpanded_line, is_syscalls);
2283 free (unexpanded_line);
2286 save_def_or_dec (aux_info_p, is_syscalls);
2288 /* Skip over the rest of this line and get to start of next line. */
2290 while (*aux_info_p != '\n')
2293 current_aux_info_lineno++;
2297 free (aux_info_base);
2298 xfree (aux_info_relocated_name);
2303 /* Check an individual filename for a .c suffix. If the filename has this
2304 suffix, rename the file such that its suffix is changed to .C. This
2305 function implements the -C option. */
/* HP is a filename hash table entry; hp->symbol is the name that is
   examined.  Nothing further is done unless the last two characters of
   the name are `.' and `c'.  Otherwise the file is linked (my_link) to
   the same name with its final character changed to `C', and the original
   name is then removed with my_unlink.  A failure of either step produces
   a warning on stderr.

   NOTE(review): filename[last_char_index-1] is read without a visible
   check that the name is at least two characters long -- confirm that
   callers never pass a shorter name.  */
2309 const hash_table_entry *hp;
2311 const char *filename = hp->symbol;
2312 int last_char_index = strlen (filename) - 1;
2313 char *const new_filename = (char *) alloca (strlen (filename) + 1);
2315 /* Note that we don't care here if the given file was converted or not. It
2316 is possible that the given file was *not* converted, simply because there
2317 was nothing in it which actually required conversion. Even in this case,
2318 we want to do the renaming. Note that we only rename files with the .c
2321 if (filename[last_char_index] != 'c' || filename[last_char_index-1] != '.')
2324 strcpy (new_filename, filename);
2325 new_filename[last_char_index] = 'C';
2327 if (my_link (filename, new_filename) == -1)
2329 fprintf (stderr, "%s: warning: can't link file `%s' to `%s': %s\n",
2330 pname, shortpath (NULL, filename),
2331 shortpath (NULL, new_filename), sys_errlist[errno]);
2336 if (my_unlink (filename) == -1)
2338 fprintf (stderr, "%s: warning: can't delete file `%s': %s\n",
2339 pname, shortpath (NULL, filename), sys_errlist[errno]);
2345 #endif /* !defined (UNPROTOIZE) */
2347 /* Take the list of definitions and declarations attached to a particular
2348 file_info node and reverse the order of the list. This should get the
2349 list into an order such that the item with the lowest associated line
2350 number is nearest the head of the list. When these lists are originally
2351 built, they are in the opposite order. We want to traverse them in
2352 normal line number order later (i.e. lowest to highest) so reverse the
/* HP is a filename hash table entry; the list that gets reversed is the
   defs_decs list of its file_info record (hp->fip).  An empty list or a
   list with a single element is left untouched.  On completion the
   file_info's defs_decs pointer is set to PREV.  */
2356 reverse_def_dec_list (hp)
2357 const hash_table_entry *hp;
2359 file_info *file_p = hp->fip;
2360 const def_dec_info *prev = NULL;
2361 const def_dec_info *current = file_p->defs_decs;
2363 if (!( current = file_p->defs_decs))
2364 return; /* no list to reverse */
2367 if (! (current = current->next_in_file))
2368 return; /* can't reverse a single list element */
/* PREV (presumably the old head at this point) will end the reversed
   list, so its forward link is cleared.  The casts drop the const
   qualifier so that the links can be rewritten.  */
2370 ((NONCONST def_dec_info *) prev)->next_in_file = NULL;
2374 const def_dec_info *next = current->next_in_file;
/* Point the current element back at its predecessor.  */
2376 ((NONCONST def_dec_info *) current)->next_in_file = prev;
2381 file_p->defs_decs = prev;
2386 /* Find the (only?) extern definition for a particular function name, starting
2387 from the head of the linked list of entries for the given name. If we
2388 cannot find an extern definition for the given function name, issue a
2389 warning and scrounge around for the next best thing, i.e. an extern
2390 function declaration with a prototype attached to it. Note that we only
2391 allow such substitutions for extern declarations and never for static
2392 declarations. That's because the only reason we allow them at all is
2393 to let un-prototyped function declarations for system-supplied library
2394 functions get their prototypes from our own extra SYSCALLS.c.X file which
2395 contains all of the correct prototypes for system functions. */
2397 static const def_dec_info *
2398 find_extern_def (head, user)
2399 const def_dec_info *head;
2400 const def_dec_info *user;
2402 const def_dec_info *dd_p;
2403 const def_dec_info *extern_def_p = NULL;
2404 int conflict_noted = 0;
2406 /* Don't act too stupid here. Somebody may try to convert an entire system
2407 in one swell fwoop (rather than one program at a time, as should be done)
2408 and in that case, we may find that there are multiple extern definitions
2409 of a given function name in the entire set of source files that we are
2410 converting. If however one of these definitions resides in exactly the
2411 same source file as the reference we are trying to satisfy then in that
2412 case it would be stupid for us to fail to realize that this one definition
2413 *must* be the precise one we are looking for.
2415 To make sure that we don't miss an opportunity to make this "same file"
2416 leap of faith, we do a prescan of the list of records relating to the
2417 given function name, and we look (on this first scan) *only* for a
2418 definition of the function which is in the same file as the reference
2419 we are currently trying to satisfy. */
2421 for (dd_p = head; dd_p; dd_p = dd_p->next_for_func)
2422 if (dd_p->is_func_def && !dd_p->is_static && dd_p->file == user->file)
2425 /* Now, since we have not found a definition in the same file as the
2426 reference, we scan the list again and consider all possibilities from
2427 all files. Here we may get conflicts with the things listed in the
2428 SYSCALLS.c.X file, but if that happens it only means that the source
2429 code being converted contains its own definition of a function which
2430 could have been supplied by libc.a. In such cases, we should avoid
2431 issuing the normal warning, and defer to the definition given in the
2434 for (dd_p = head; dd_p; dd_p = dd_p->next_for_func)
2435 if (dd_p->is_func_def && !dd_p->is_static)
2437 if (!extern_def_p) /* Previous definition? */
2438 extern_def_p = dd_p; /* Remember the first definition found. */
2441 /* Ignore definition just found if it came from SYSCALLS.c.X. */
2443 if (is_syscalls_file (dd_p->file))
2446 /* Quietly replace the definition previously found with the one
2447 just found if the previous one was from SYSCALLS.c.X. */
2449 if (is_syscalls_file (extern_def_p->file))
2451 extern_def_p = dd_p;
2455 /* If we get here, then there is a conflict between two function
2456 declarations for the same function, both of which came from the
2459 if (!conflict_noted) /* first time we noticed? */
2462 fprintf (stderr, "%s: error: conflicting extern definitions of '%s'\n",
2463 pname, head->hash_entry->symbol);
2466 fprintf (stderr, "%s: declarations of '%s' will not be converted\n",
2467 pname, head->hash_entry->symbol);
2468 fprintf (stderr, "%s: conflict list for '%s' follows:\n",
2469 pname, head->hash_entry->symbol);
2470 fprintf (stderr, "%s: %s(%d): %s\n",
2472 shortpath (NULL, extern_def_p->file->hash_entry->symbol),
2473 extern_def_p->line, extern_def_p->ansi_decl);
2477 fprintf (stderr, "%s: %s(%d): %s\n",
2479 shortpath (NULL, dd_p->file->hash_entry->symbol),
2480 dd_p->line, dd_p->ansi_decl);
2484 /* We want to err on the side of caution, so if we found multiple conflicting
2485 definitions for the same function, treat this as being the same as if we
2486 had found no definitions (i.e. return NULL). */
2493 /* We have no definitions for this function so do the next best thing.
2494 Search for an extern declaration already in prototype form. */
2496 for (dd_p = head; dd_p; dd_p = dd_p->next_for_func)
2497 if (!dd_p->is_func_def && !dd_p->is_static && dd_p->prototyped)
2499 extern_def_p = dd_p; /* save a pointer to the definition */
2501 fprintf (stderr, "%s: warning: using formals list from %s(%d) for function `%s'\n",
2503 shortpath (NULL, dd_p->file->hash_entry->symbol),
2504 dd_p->line, dd_p->hash_entry->symbol);
2508 /* Gripe about unprototyped function declarations that we found no
2509 corresponding definition (or other source of prototype information)
2512 Gripe even if the unprototyped declaration we are worried about
2513 exists in a file in one of the "system" include directories. We
2514 can gripe about these because we should have at least found a
2515 corresponding (pseudo) definition in the SYSCALLS.c.X file. If we
2516 didn't, then that means that the SYSCALLS.c.X file is missing some
2517 needed prototypes for this particular system. That is worth telling
2522 const char *file = user->file->hash_entry->symbol;
2525 if (in_system_include_dir (file))
2527 /* Why copy this string into `needed' at all?
2528 Why not just use user->ansi_decl without copying? */
2529 char *needed = (char *) alloca (strlen (user->ansi_decl) + 1);
2532 strcpy (needed, user->ansi_decl);
2533 p = (NONCONST char *) substr (needed, user->hash_entry->symbol)
2534 + strlen (user->hash_entry->symbol) + 2;
2535 strcpy (p, "??\?);");
2537 fprintf (stderr, "%s: %d: `%s' used but missing from SYSCALLS\n",
2538 shortpath (NULL, file), user->line,
2539 needed+7); /* Don't print "extern " */
2542 fprintf (stderr, "%s: %d: warning: no extern definition for `%s'\n",
2543 shortpath (NULL, file), user->line,
2544 user->hash_entry->symbol);
2547 return extern_def_p;
2550 /* Find the (only?) static definition for a particular function name in a
2551 given file. Here we get the function-name and the file info indirectly
2552 from the def_dec_info record pointer which is passed in.

   USER is the declaration being resolved.  The candidates are the records
   on the list headed by user->hash_entry->ddip and linked through
   next_for_func; a candidate matches when it is a function definition, is
   static, and has the same file as USER.  The matching record is
   remembered in static_def_p, which is what the final return statement
   hands back.  Diagnostics are written to stderr both for the case where
   the count of matches is zero and for the case where it is greater than
   one.  */
2554 static const def_dec_info *
2555 find_static_definition (user)
2556 const def_dec_info *user;
2558 const def_dec_info *head = user->hash_entry->ddip;
2559 const def_dec_info *dd_p;
2560 int num_static_defs = 0;
2561 const def_dec_info *static_def_p = NULL;
2563 for (dd_p = head; dd_p; dd_p = dd_p->next_for_func)
2564 if (dd_p->is_func_def && dd_p->is_static && (dd_p->file == user->file))
2566 static_def_p = dd_p; /* save a pointer to the definition */
2569 if (num_static_defs == 0)
2572 fprintf (stderr, "%s: warning: no static definition for `%s' in file `%s'\n",
2573 pname, head->hash_entry->symbol,
2574 shortpath (NULL, user->file->hash_entry->symbol));
2576 else if (num_static_defs > 1)
2578 fprintf (stderr, "%s: error: multiple static defs of `%s' in file `%s'\n",
2579 pname, head->hash_entry->symbol,
2580 shortpath (NULL, user->file->hash_entry->symbol));
2583 return static_def_p;
2586 /* Find good prototype style formal argument lists for all of the function
2587 declarations which didn't have them before now.
2589 To do this we consider each function name one at a time. For each function
2590 name, we look at the items on the linked list of def_dec_info records for
2591 that particular name.
2593 Somewhere on this list we should find one (and only one) def_dec_info
2594 record which represents the actual function definition, and this record
2595 should have a nice formal argument list already associated with it.
2597 Thus, all we have to do is to connect up all of the other def_dec_info
2598 records for this particular function name to the special one which has
2599 the full-blown formals list.

   HP is the hash table entry for one function name.  The records visited
   are those on the list hp->ddip, linked through next_for_func, and the
   outcome of the matching is stored in the `definition' field of each
   record.

2601 Of course it is a little more complicated than just that. See below for
2605 connect_defs_and_decs (hp)
2606 const hash_table_entry *hp;
2608 const def_dec_info *dd_p;
2609 const def_dec_info *extern_def_p = NULL;
2610 int first_extern_reference = 1;
2612 /* Traverse the list of definitions and declarations for this particular
2613 function name. For each item on the list, if it is a function
2614 definition (either old style or new style) then GCC has already been
2615 kind enough to produce a prototype for us, and it is associated with
2616 the item already, so declare the item as its own associated "definition".
2618 Also, for each item which is only a function declaration, but which
2619 nonetheless has its own prototype already (obviously supplied by the user)
2620 declare the item as its own definition.
2622 Note that when/if there are multiple user-supplied prototypes already
2623 present for multiple declarations of any given function, these multiple
2624 prototypes *should* all match exactly with one another and with the
2625 prototype for the actual function definition. We don't check for this
2626 here however, since we assume that the compiler must have already done
2627 this consistency checking when it was creating the .X files. */
2629 for (dd_p = hp->ddip; dd_p; dd_p = dd_p->next_for_func)
2630 if (dd_p->prototyped)
2631 ((NONCONST def_dec_info *) dd_p)->definition = dd_p;
2633 /* Traverse the list of definitions and declarations for this particular
2634 function name. For each item on the list, if it is an extern function
2635 declaration and if it has no associated definition yet, go try to find
2636 the matching extern definition for the declaration.
2638 When looking for the matching function definition, warn the user if we
2641 If we find more than one function definition also issue a warning.
2643 Do the search for the matching definition only once per unique function
2644 name (and only when absolutely needed) so that we can avoid putting out
2645 redundant warning messages, and so that we will only put out warning
2646 messages when there is actually a reference (i.e. a declaration) for
2647 which we need to find a matching definition. */
2649 for (dd_p = hp->ddip; dd_p; dd_p = dd_p->next_for_func)
2650 if (!dd_p->is_func_def && !dd_p->is_static && !dd_p->definition)
2652 if (first_extern_reference)
2654 extern_def_p = find_extern_def (hp->ddip, dd_p);
2655 first_extern_reference = 0;
2657 ((NONCONST def_dec_info *) dd_p)->definition = extern_def_p;
2660 /* Traverse the list of definitions and declarations for this particular
2661 function name. For each item on the list, if it is a static function
2662 declaration and if it has no associated definition yet, go try to find
2663 the matching static definition for the declaration within the same file.
2665 When looking for the matching function definition, warn the user if we
2666 fail to find one in the same file with the declaration, and refuse to
2667 convert this kind of cross-file static function declaration. After all,
2668 this is stupid practice and should be discouraged.
2670 We don't have to worry about the possibility that there is more than one
2671 matching function definition in the given file because that would have
2672 been flagged as an error by the compiler.
2674 Do the search for the matching definition only once per unique
2675 function-name/source-file pair (and only when absolutely needed) so that
2676 we can avoid putting out redundant warning messages, and so that we will
2677 only put out warning messages when there is actually a reference (i.e. a
2678 declaration) for which we actually need to find a matching definition. */
2680 for (dd_p = hp->ddip; dd_p; dd_p = dd_p->next_for_func)
2681 if (!dd_p->is_func_def && dd_p->is_static && !dd_p->definition)
2683 const def_dec_info *dd_p2;
2684 const def_dec_info *static_def;
2686 /* We have now found a single static declaration for which we need to
2687 find a matching definition. We want to minimize the work (and the
2688 number of warnings), so we will find an appropriate (matching)
2689 static definition for this declaration, and then distribute it
2690 (as the definition for) any and all other static declarations
2691 for this function name which occur within the same file, and which
2692 do not already have definitions.
2694 Note that a trick is used here to prevent subsequent attempts to
2695 call find_static_definition for a given function-name & file
2696 if the first such call returns NULL. Essentially, we convert
2697 these NULL return values to -1, and put the -1 into the definition
2698 field for each other static declaration from the same file which
2699 does not already have an associated definition.
2700 This makes these other static declarations look like they are
2701 actually defined already when the outer loop here revisits them
2702 later on. Thus, the outer loop will skip over them. Later, we
2703 turn the -1's back to NULL's. */
2705 ((NONCONST def_dec_info *) dd_p)->definition =
2706 (static_def = find_static_definition (dd_p))
2708 : (const def_dec_info *) -1;
2710 for (dd_p2 = dd_p->next_for_func; dd_p2; dd_p2 = dd_p2->next_for_func)
2711 if (!dd_p2->is_func_def && dd_p2->is_static
2712 && !dd_p2->definition && (dd_p2->file == dd_p->file))
2713 ((NONCONST def_dec_info *)dd_p2)->definition = dd_p->definition;
2716 /* Convert any dummy (-1) definitions we created in the step above back to
2717 NULL's (as they should be). */
2719 for (dd_p = hp->ddip; dd_p; dd_p = dd_p->next_for_func)
2720 if (dd_p->definition == (def_dec_info *) -1)
2721 ((NONCONST def_dec_info *) dd_p)->definition = NULL;
2724 #endif /* !defined (UNPROTOIZE) */
2726 /* Give a pointer into the clean text buffer, return a number which is the
2727 original source line number that the given pointer points into. */
2730 identify_lineno (clean_p)
2731 const char *clean_p;
2736 for (scan_p = clean_text_base; scan_p <= clean_p; scan_p++)
2737 if (*scan_p == '\n')
2742 /* Issue an error message and give up on doing this particular edit.

   The message is written to stderr and names convert_filename (passed
   through shortpath) together with a line number.  One of the two calls
   below reports last_known_line_number; the other derives the number
   from CLEAN_P by way of identify_lineno.  Control then leaves through
   longjmp to source_confusion_recovery with the value 1, so the code
   following the call site is not resumed.  */
2745 declare_source_confusing (clean_p)
2746 const char *clean_p;
2751 fprintf (stderr, "%s: %d: warning: source too confusing\n",
2752 shortpath (NULL, convert_filename), last_known_line_number);
2754 fprintf (stderr, "%s: %d: warning: source too confusing\n",
2755 shortpath (NULL, convert_filename),
2756 identify_lineno (clean_p));
2758 longjmp (source_confusion_recovery, 1);
/* Verify an assumption about the original source code.  COND is the result
   of a test which is expected to hold.  When it does not hold, the source
   is declared too confusing, which issues a message and abandons the
   conversion in progress; CLEAN_P is handed on to
   declare_source_confusing so that it can report a location.  */

static void
check_source (cond, clean_p)
     int cond;
     const char *clean_p;
{
  if (cond)
    return;

  declare_source_confusing (clean_p);
}
2774 /* If we think of the in-core cleaned text buffer as a memory mapped
2775 file (with the variable last_known_line_start acting as sort of a
2776 file pointer) then we can imagine doing "seeks" on the buffer. The
2777 following routine implements a kind of "seek" operation for the in-core
2778 (cleaned) copy of the source file. When finished, it returns a pointer to
2779 the start of a given (numbered) line in the cleaned text buffer.
2781 Note that protoize only has to "seek" in the forward direction on the
2782 in-core cleaned text file buffers, and it never needs to back up.
2784 This routine is made a little bit faster by remembering the line number
2785 (and pointer value) supplied (and returned) from the previous "seek".
2786 This prevents us from always having to start all over back at the top
2787 of the in-core cleaned buffer again.

   The remembered position is kept in last_known_line_number and
   last_known_line_start.  A request for a line number lower than
   last_known_line_number is tested for separately, before the forward
   scan.  Moving forward by one line means stepping to that line's
   newline, with each step checked against clean_text_limit through
   check_source, and then stepping over the newline.  */
2793 if (n < last_known_line_number)
2796 while (n > last_known_line_number)
2798 while (*last_known_line_start != '\n')
2799 check_source (++last_known_line_start < clean_text_limit, 0);
2800 last_known_line_start++;
2801 last_known_line_number++;
2803 return last_known_line_start;
2806 /* Given a pointer to a character in the cleaned text buffer, return a pointer
2807 to the next non-whitepace character which follows it. */
2810 forward_to_next_token_char (ptr)
2813 for (++ptr; isspace (*ptr); check_source (++ptr < clean_text_limit, 0))
2818 /* Copy a chunk of text of length `len' and starting at `str' to the current
2819 output buffer. Note that all attempts to add stuff to the current output
2820 buffer ultimately go through here. */
2823 output_bytes (str, len)
2827 if ((repl_write_ptr + 1) + len >= repl_text_limit)
2829 size_t new_size = (repl_text_limit - repl_text_base) << 1;
2830 char *new_buf = (char *) xrealloc (repl_text_base, new_size);
2832 repl_write_ptr = new_buf + (repl_write_ptr - repl_text_base);
2833 repl_text_base = new_buf;
2834 repl_text_limit = new_buf + new_size;
2836 memcpy (repl_write_ptr + 1, str, len);
2837 repl_write_ptr += len;
/* Append the characters of the null terminated string STR, not counting
   the terminating null itself, to the current output buffer.  */

static void
output_string (str)
     const char *str;
{
  size_t length = strlen (str);

  output_bytes (str, length);
}
2850 /* Copy some characters from the original text buffer to the current output
2853 This routine takes a pointer argument `p' which is assumed to be a pointer
2854 into the cleaned text buffer. The bytes which are copied are the `original'
2855 equivalents for the set of bytes between the last value of `clean_read_ptr'
2856 and the argument value `p'.
2858 The set of bytes copied however, comes *not* from the cleaned text buffer,
2859 but rather from the direct counterparts of these bytes within the original
2862 Thus, when this function is called, some bytes from the original text
2863 buffer (which may include original comments and preprocessing directives)
2864 will be copied into the output buffer.
2866 Note that the request implied when this routine is called includes the
2867 byte pointed to by the argument pointer `p'.

   The number of bytes copied is p - clean_read_ptr.  The copy starts in
   the original text buffer at the same offset from orig_text_base that
   the byte after clean_read_ptr has from clean_text_base.  Nothing is
   passed to output_bytes when that count is zero.  */
2873 size_t copy_length = (size_t) (p - clean_read_ptr);
2874 const char *copy_start = orig_text_base+(clean_read_ptr-clean_text_base)+1;
2876 if (copy_length == 0)
2879 output_bytes (copy_start, copy_length);
2883 /* Given a pointer to a def_dec_info record which represents some form of
2884 definition of a function (perhaps a real definition, or in lieu of that
2885 perhaps just a declaration with a full prototype) return true if this
2886 function is one which we should avoid converting. Return false
2890 other_variable_style_function (ansi_header)
2891 const char *ansi_header;
2895 /* See if we have a stdarg function, or a function which has stdarg style
2896 parameters or a stdarg style return type. */
2898 return (int) substr (ansi_header, "...");
2900 #else /* !defined (UNPROTOIZE) */
2902 /* See if we have a varargs function, or a function which has varargs style
2903 parameters or a varargs style return type. */
2906 int len = strlen (varargs_style_indicator);
2908 for (p = ansi_header; p; )
2910 const char *candidate;
2912 if ((candidate = substr (p, varargs_style_indicator)) == 0)
2915 if (!is_id_char (candidate[-1]) && !is_id_char (candidate[len]))
2921 #endif /* !defined (UNPROTOIZE) */
2924 /* Do the editing operation specifically for a function "declaration". Note
2925 that editing for function "definitions" is handled in a separate routine

   DEF_DEC_P is the record for the declaration being edited, and
   CLEAN_TEXT_P points into the cleaned text at the line which holds the
   comma or semicolon following that declaration.  When protoizing, the
   replacement formals lists are taken one after another from the
   f_list_chain of def_dec_p->definition.  Source text which does not
   look the way this routine expects is reported through check_source;
   the setjmp on source_confusion_recovery below is the recovery point,
   where restore_pointers is called and a "not converted" message is
   printed.

2929 edit_fn_declaration (def_dec_p, clean_text_p)
2930 const def_dec_info *def_dec_p;
2931 const char *VOLATILE clean_text_p;
2933 const char *start_formals;
2934 const char *end_formals;
2935 const char *function_to_edit = def_dec_p->hash_entry->symbol;
2936 size_t func_name_len = strlen (function_to_edit);
2937 const char *end_of_fn_name;
2941 const f_list_chain_item *this_f_list_chain_item;
2942 const def_dec_info *definition = def_dec_p->definition;
2944 /* If we are protoizing, and if we found no corresponding definition for
2945 this particular function declaration, then just leave this declaration
2946 exactly as it is. */
2951 /* If we are protoizing, and if the corresponding definition that we found
2952 for this particular function declaration defined an old style varargs
2953 function, then we want to issue a warning and just leave this function
2954 declaration unconverted. */
2956 if (other_variable_style_function (definition->ansi_decl))
2959 fprintf (stderr, "%s: %d: warning: varargs function declaration not converted\n",
2960 shortpath (NULL, def_dec_p->file->hash_entry->symbol),
2965 #endif /* !defined (UNPROTOIZE) */
2967 /* Setup here to recover from confusing source code detected during this
2968 particular "edit". */
2971 if (setjmp (source_confusion_recovery))
2973 restore_pointers ();
2974 fprintf (stderr, "%s: declaration of function `%s' not converted\n",
2975 pname, function_to_edit);
2979 /* We are editing a function declaration. The line number we did a seek to
2980 contains the comma or semicolon which follows the declaration. Our job
2981 now is to scan backwards looking for the function name. This name *must*
2982 be followed by open paren (ignoring whitespace, of course). We need to
2983 replace everything between that open paren and the corresponding closing
2984 paren. If we are protoizing, we need to insert the prototype-style
2985 formals lists. If we are unprotoizing, we need to just delete everything
2986 between the pairs of opening and closing parens. */
2988 /* First move up to the end of the line. */
2990 while (*clean_text_p != '\n')
2991 check_source (++clean_text_p < clean_text_limit, 0);
2992 clean_text_p--; /* Point to just before the newline character. */
2994 /* Now we can scan backwards for the function name. */
3000 /* Scan leftwards until we find some character which can be
3001 part of an identifier. */
3003 while (!is_id_char (*clean_text_p))
3004 check_source (--clean_text_p > clean_read_ptr, 0);
3006 /* Scan backwards until we find a char that cannot be part of an
3009 while (is_id_char (*clean_text_p))
3010 check_source (--clean_text_p > clean_read_ptr, 0);
3012 /* Having found an "id break", see if the following id is the one
3013 that we are looking for. If so, then exit from this loop. */
3015 if (!strncmp (clean_text_p+1, function_to_edit, func_name_len))
3017 char ch = *(clean_text_p + 1 + func_name_len);
3019 /* Must also check to see that the name in the source text
3020 ends where it should (in order to prevent bogus matches
3021 on similar but longer identifiers). */
3023 if (! is_id_char (ch))
3024 break; /* exit from loop */
3028 /* We have now found the first perfect match for the function name in
3029 our backward search. This may or may not be the actual function
3030 name at the start of the actual function declaration (i.e. we could
3031 have easily been misled). We will try to avoid getting fooled too
3032 often by looking forward for the open paren which should follow the
3033 identifier we just found. We ignore whitespace while hunting. If
3034 the next non-whitespace byte we see is *not* an open left paren,
3035 then we must assume that we have been fooled and we start over
3036 again accordingly. Note that there is no guarantee, that even if
3037 we do see the open paren, that we are in the right place.
3038 Programmers do the strangest things sometimes! */
3040 end_of_fn_name = clean_text_p + strlen (def_dec_p->hash_entry->symbol);
3041 start_formals = forward_to_next_token_char (end_of_fn_name);
3043 while (*start_formals != '(');
3045 /* start_formals now points to the opening left paren which immediately
3046 follows the name of the function. */
3048 /* Note that there may be several formals lists which need to be modified
3049 due to the possibility that the return type of this function is a
3050 pointer-to-function type. If there are several formals lists, we
3051 convert them in left-to-right order here. */
3054 this_f_list_chain_item = definition->f_list_chain;
3055 #endif /* !defined (UNPROTOIZE) */
3062 end_formals = start_formals + 1;
3064 for (; depth; check_source (++end_formals < clean_text_limit, 0))
3066 switch (*end_formals)
3079 /* end_formals now points to the closing right paren of the formals
3080 list whose left paren is pointed to by start_formals. */
3082 /* Now, if we are protoizing, we insert the new ANSI-style formals list
3083 attached to the associated definition of this function. If however
3084 we are unprotoizing, then we simply delete any formals list which
3087 output_up_to (start_formals);
3089 if (this_f_list_chain_item)
3091 output_string (this_f_list_chain_item->formals_list);
3092 this_f_list_chain_item = this_f_list_chain_item->chain_next;
3097 fprintf (stderr, "%s: warning: too many parameter lists in declaration of `%s'\n",
3098 pname, def_dec_p->hash_entry->symbol);
3099 check_source (0, end_formals); /* leave the declaration intact */
3101 #endif /* !defined (UNPROTOIZE) */
3102 clean_read_ptr = end_formals - 1;
3104 /* Now see if it looks like there may be another formals list associated
3105 with the function declaration that we are converting (following the
3106 formals list that we just converted). */
3109 const char *another_r_paren = forward_to_next_token_char (end_formals);
3111 if ((*another_r_paren != ')')
3112 || (*(start_formals = forward_to_next_token_char (another_r_paren)) != '('))
3115 if (this_f_list_chain_item)
3118 fprintf (stderr, "\n%s: warning: too few parameter lists in declaration of `%s'\n",
3119 pname, def_dec_p->hash_entry->symbol);
3120 check_source (0, start_formals); /* leave the decl intact */
3122 #endif /* !defined (UNPROTOIZE) */
3128 /* There does appear to be yet another formals list, so loop around
3129 again, and convert it also. */
3133 /* Edit a whole group of formals lists, starting with the rightmost one
3134 from some set of formals lists. This routine is called once (from the
3135 outside) for each function declaration which is converted. It is
3136 recursive however, and it calls itself once for each remaining formal
3137 list that lies to the left of the one it was originally called to work
3138 on. Thus, a whole set gets done in right-to-left order.
3140 This routine returns non-zero if it thinks that it should not be trying
3141 to convert this particular function definition (because the name of the
3142 function doesn't match the one expected).

   END_FORMALS is the right end of the formals list to work on; the
   matching left paren is located by scanning leftwards from just before
   it, with every step checked against clean_read_ptr.  F_LIST_COUNT
   says how many links of def_dec_p->f_list_chain have to be followed to
   reach the formals list to output, and the check of the function name
   against def_dec_p->hash_entry->symbol is made when it is zero.  After
   the text up to the left paren has been output, clean_read_ptr is set
   to end_formals - 1.  */
3145 edit_formals_lists (end_formals, f_list_count, def_dec_p)
3146 const char *end_formals;
3147 unsigned int f_list_count;
3148 const def_dec_info *def_dec_p;
3150 const char *start_formals;
3153 start_formals = end_formals - 1;
3155 for (; depth; check_source (--start_formals > clean_read_ptr, 0))
3157 switch (*start_formals)
3169 /* start_formals now points to the opening left paren of the formals list. */
3175 const char *next_end;
3177 /* There should be more formal lists to the left of here. */
3179 next_end = start_formals - 1;
3180 check_source (next_end > clean_read_ptr, 0);
3181 while (isspace (*next_end))
3182 check_source (--next_end > clean_read_ptr, 0);
3183 check_source (*next_end == ')', next_end);
3184 check_source (--next_end > clean_read_ptr, 0);
3185 check_source (*next_end == ')', next_end);
3186 if (edit_formals_lists (next_end, f_list_count, def_dec_p))
3190 /* Check that the function name in the header we are working on is the same
3191 as the one we would expect to find. If not, issue a warning and return
3194 if (f_list_count == 0)
3196 const char *expected = def_dec_p->hash_entry->symbol;
3197 const char *func_name_start;
3198 const char *func_name_limit;
3199 size_t func_name_len;
3201 for (func_name_limit = start_formals-1; isspace (*func_name_limit); )
3202 check_source (--func_name_limit > clean_read_ptr, 0);
3204 for (func_name_start = func_name_limit++;
3205 is_id_char (*func_name_start);
3207 check_source (func_name_start > clean_read_ptr, 0);
3209 func_name_len = func_name_limit - func_name_start;
3210 if (func_name_len == 0)
3211 check_source (0, func_name_start);
3212 if (func_name_len != strlen (expected)
3213 || strncmp (func_name_start, expected, func_name_len))
3215 fprintf (stderr, "%s: %d: warning: found `%s' but expected `%s'\n",
3216 shortpath (NULL, def_dec_p->file->hash_entry->symbol),
3217 identify_lineno (func_name_start),
3218 dupnstr (func_name_start, func_name_len),
3224 output_up_to (start_formals);
3227 if (f_list_count == 0)
3228 output_string (def_dec_p->formal_names);
3229 #else /* !defined (UNPROTOIZE) */
3231 unsigned f_list_depth;
3232 const f_list_chain_item *flci_p = def_dec_p->f_list_chain;
3234 /* At this point, the current value of f_list count says how many
3235 links we have to follow through the f_list_chain to get to the
3236 particular formals list that we need to output next. */
3238 for (f_list_depth = 0; f_list_depth < f_list_count; f_list_depth++)
3239 flci_p = flci_p->chain_next;
3240 output_string (flci_p->formals_list);
3242 #endif /* !defined (UNPROTOIZE) */
3244 clean_read_ptr = end_formals - 1;
3248 /* Given a pointer to a byte in the clean text buffer which points to the
3249 beginning of a line that contains a "follower" token for a function
3250 definition header, do whatever is necessary to find the right closing
3251 paren for the rightmost formals list of the function definition header.

   The scan first runs from CLEAN_TEXT_P to the end of its line and then
   proceeds leftwards looking for a right paren, with every backward step
   checked against clean_read_ptr through check_source.  When
   unprotoizing, the token which follows that paren is required to be an
   open curly brace.  Otherwise a paren is accepted when the following
   token is an open curly brace or an alphabetic character, and the
   leftward scan resumes when it is not.

3255 find_rightmost_formals_list (clean_text_p)
3256 const char *clean_text_p;
3258 const char *end_formals;
3260 /* We are editing a function definition. The line number we did a seek
3261 to contains the first token which immediately follows the entire set of
3262 formals lists which are part of this particular function definition
3265 Our job now is to scan leftwards in the clean text looking for the
3266 right-paren which is at the end of the function header's rightmost
3269 If we ignore whitespace, this right paren should be the first one we
3270 see which is (ignoring whitespace) immediately followed either by the
3271 open curly-brace beginning the function body or by an alphabetic
3272 character (in the case where the function definition is in old (K&R)
3273 style and there are some declarations of formal parameters). */
3275 /* It is possible that the right paren we are looking for is on the
3276 current line (together with its following token). Just in case that
3277 might be true, we start out here by skipping down to the right end of
3278 the current line before starting our scan. */
3280 for (end_formals = clean_text_p; *end_formals != '\n'; end_formals++)
3286 /* Now scan backwards while looking for the right end of the rightmost
3287 formals list associated with this function definition. */
3291 const char *l_brace_p;
3293 /* Look leftward and try to find a right-paren. */
3295 while (*end_formals != ')')
3297 if (isspace (*end_formals))
3298 while (isspace (*end_formals))
3299 check_source (--end_formals > clean_read_ptr, 0);
3301 check_source (--end_formals > clean_read_ptr, 0);
3304 ch = *(l_brace_p = forward_to_next_token_char (end_formals));
3305 /* Since we are unprotoizing an ANSI-style (prototyped) function
3306 definition, there had better not be anything (except whitespace)
3307 between the end of the ANSI formals list and the beginning of the
3308 function body (i.e. the '{'). */
3310 check_source (ch == '{', l_brace_p);
3313 #else /* !defined (UNPROTOIZE) */
3315 /* Now scan backwards while looking for the right end of the rightmost
3316 formals list associated with this function definition. */
3321 const char *l_brace_p;
3323 /* Look leftward and try to find a right-paren. */
3325 while (*end_formals != ')')
3327 if (isspace (*end_formals))
3328 while (isspace (*end_formals))
3329 check_source (--end_formals > clean_read_ptr, 0);
3331 check_source (--end_formals > clean_read_ptr, 0);
3334 ch = *(l_brace_p = forward_to_next_token_char (end_formals));
3336 /* Since it is possible that we found a right paren before the starting
3337 '{' of the body which IS NOT the one at the end of the real K&R
3338 formals list (say for instance, we found one embedded inside one of
3339 the old K&R formal parameter declarations) we have to check to be
3340 sure that this is in fact the right paren that we were looking for.
3342 The one we were looking for *must* be followed by either a '{' or
3343 by an alphabetic character, while others *cannot* legally be followed
3344 by such characters. */
3346 if ((ch == '{') || isalpha (ch))
3349 /* At this point, we have found a right paren, but we know that it is
3350 not the one we were looking for, so backup one character and keep
3353 check_source (--end_formals > clean_read_ptr, 0);
3356 #endif /* !defined (UNPROTOIZE) */
3363 /* Insert into the output file a totally new declaration for a function
3364 which (up until now) was being called from within the current block
3365 without having been declared at any point such that the declaration
3366 was visible (i.e. in scope) at the point of the call.
3368 We need to add in explicit declarations for all such function calls
3369 in order to get the full benefit of prototype-based function call
3370 parameter type checking.

   DEF_DEC_P describes the function concerned; the text inserted comes
   from the ansi_decl of def_dec_p->definition.  CLEAN_TEXT_P points at
   the start of the line which is expected to contain the open curly
   brace of the block.  The existing indentation which follows that brace
   is located first and is written out again after the new declaration.
   Source text which does not look as expected is reported through
   check_source; the setjmp on source_confusion_recovery below is the
   recovery point, where restore_pointers is called and a "not inserted"
   message is printed.  */
3373 add_local_decl (def_dec_p, clean_text_p)
3374 const def_dec_info *def_dec_p;
3375 const char *clean_text_p;
3377 const char *start_of_block;
3378 const char *function_to_edit = def_dec_p->hash_entry->symbol;
3380 /* Don't insert new local explicit declarations unless explicitly requested
3386 /* Setup here to recover from confusing source code detected during this
3387 particular "edit". */
3390 if (setjmp (source_confusion_recovery))
3392 restore_pointers ();
3393 fprintf (stderr, "%s: local declaration for function `%s' not inserted\n",
3394 pname, function_to_edit);
3398 /* We have already done a seek to the start of the line which should
3399 contain *the* open curly brace which begins the block in which we need
3400 to insert an explicit function declaration (to replace the implicit one).
3402 Now we scan that line, starting from the left, until we find the
3403 open curly brace we are looking for. Note that there may actually be
3404 multiple open curly braces on the given line, but we will be happy
3405 with the leftmost one no matter what. */
3407 start_of_block = clean_text_p;
3408 while (*start_of_block != '{' && *start_of_block != '\n')
3409 check_source (++start_of_block < clean_text_limit, 0);
3411 /* Note that the line from the original source could possibly
3412 contain *no* open curly braces! This happens if the line contains
3413 a macro call which expands into a chunk of text which includes a
3414 block (and that block's associated open and close curly braces).
3415 In cases like this, we give up, issue a warning, and do nothing. */
3417 if (*start_of_block != '{')
3421 "\n%s: %d: warning: can't add declaration of `%s' into macro call\n",
3422 def_dec_p->file->hash_entry->symbol, def_dec_p->line,
3423 def_dec_p->hash_entry->symbol);
3427 /* Figure out what a nice (pretty) indentation would be for the new
3428 declaration we are adding. In order to do this, we must scan forward
3429 from the '{' until we find the first line which starts with some
3430 non-whitespace characters (i.e. real "token" material). */
3433 const char *ep = forward_to_next_token_char (start_of_block) - 1;
3436 /* Now we have ep pointing at the rightmost byte of some existing indent
3437 stuff. At least that is the hope.
3439 We can now just scan backwards and find the left end of the existing
3440 indentation string, and then copy it to the output buffer. */
3442 for (sp = ep; isspace (*sp) && *sp != '\n'; sp--)
3445 /* Now write out the open { which began this block, and any following
3446 trash up to and including the last byte of the existing indent that
3451 /* Now we go ahead and insert the new declaration at this point.
3453 If the definition of the given function is in the same file that we
3454 are currently editing, and if its full ANSI declaration normally
3455 would start with the keyword `extern', suppress the `extern'. */
3458 const char *decl = def_dec_p->definition->ansi_decl;
3460 if ((*decl == 'e') && (def_dec_p->file == def_dec_p->definition->file))
3462 output_string (decl);
3465 /* Finally, write out a new indent string, just like the preceding one
3466 that we found. This will typically include a newline as the first
3467 character of the indent string. */
3469 output_bytes (sp, (size_t) (ep - sp) + 1);
3473 /* Given a pointer to a file_info record, and a pointer to the beginning
3474 of a line (in the clean text buffer) which is assumed to contain the
3475 first "follower" token for the first function definition header in the
3476 given file, find a good place to insert some new global function
3477 declarations (which will replace scattered and imprecise implicit ones)
3478 and then insert the new explicit declarations at that point in the file.
FILE_P supplies the defs_decs chain that is walked for implicitly
declared functions; CLEAN_TEXT_P is the position handed to
find_rightmost_formals_list to locate the insertion point. */
3481 add_global_decls (file_p, clean_text_p)
3482 const file_info *file_p;
3483 const char *clean_text_p;
3485 const def_dec_info *dd_p;
3488 /* Setup here to recover from confusing source code detected during this
3489 particular "edit". */
/* NOTE(review): presumably a failed check_source longjmps back to this
setjmp, after which the output pointers are restored and a message is
printed -- confirm against check_source. */
3492 if (setjmp (source_confusion_recovery))
3494 restore_pointers ();
3495 fprintf (stderr, "%s: global declarations for file `%s' not inserted\n",
3496 pname, shortpath (NULL, file_p->hash_entry->symbol));
3500 /* Start by finding a good location for adding the new explicit function
3501 declarations. To do this, we scan backwards, ignoring whitespace
3502 and comments and other junk until we find either a semicolon, or until
3503 we hit the beginning of the file. */
3505 scan_p = find_rightmost_formals_list (clean_text_p);
3508 if (scan_p < clean_text_base)
3510 check_source (scan_p > clean_read_ptr, 0);
3515 /* scan_p now points either to a semicolon, or to just before the start
3516 of the whole file. */
3518 /* Now scan forward for the first non-whitespace character. In theory,
3519 this should be the first character of the following function definition
3520 header. We will put in the added declarations just prior to that. */
3523 while (isspace (*scan_p))
3527 output_up_to (scan_p);
3529 /* Now write out full prototypes for all of the things that had been
3530 implicitly declared in this file (but only those for which we were
3531 actually able to find unique matching definitions). Avoid duplicates
3532 by marking things that we write out as we go. */
3535 int some_decls_added = 0;
3537 for (dd_p = file_p->defs_decs; dd_p; dd_p = dd_p->next_in_file)
3538 if (dd_p->is_implicit && dd_p->definition && !dd_p->definition->written)
3540 const char *decl = dd_p->definition->ansi_decl;
3542 /* If the function for which we are inserting a declaration is
3543 actually defined later in the same file, then suppress the
3544 leading `extern' keyword (if there is one). */
3546 if (*decl == 'e' && (dd_p->file == dd_p->definition->file))
3549 output_string ("\n");
3550 output_string (decl);
3551 some_decls_added = 1;
/* The definition record is reached through a const-qualified pointer,
hence the NONCONST cast needed to set its `written' mark. */
3552 ((NONCONST def_dec_info *) dd_p->definition)->written = 1;
/* Separate the inserted declarations from the text that follows, but
only if something was actually written. */
3554 if (some_decls_added)
3555 output_string ("\n\n");
3558 /* Unmark all of the definitions that we just marked. */
3560 for (dd_p = file_p->defs_decs; dd_p; dd_p = dd_p->next_in_file)
3561 if (dd_p->definition)
3562 ((NONCONST def_dec_info *) dd_p->definition)->written = 0;
3565 #endif /* !defined (UNPROTOIZE) */
3567 /* Do the editing operation specifically for a function "definition". Note
3568 that editing operations for function "declarations" are handled by a
3569 separate routine above.
DEF_DEC_P describes the definition being converted; CLEAN_TEXT_P is the
position in the clean text buffer from which the rightmost formals list
of the definition header is located. */
3572 edit_fn_definition (def_dec_p, clean_text_p)
3573 const def_dec_info *def_dec_p;
3574 const char *clean_text_p;
3576 const char *end_formals;
3577 const char *function_to_edit = def_dec_p->hash_entry->symbol;
3579 /* Setup here to recover from confusing source code detected during this
3580 particular "edit". */
3583 if (setjmp (source_confusion_recovery))
3585 restore_pointers ();
3586 fprintf (stderr, "%s: definition of function `%s' not converted\n",
3587 pname, function_to_edit);
3591 end_formals = find_rightmost_formals_list (clean_text_p);
3593 /* end_formals now points to the closing right paren of the rightmost
3594 formals list which is actually part of the `header' of the function
3595 definition that we are converting. */
3597 /* If the header of this function definition looks like it declares a
3598 function with a variable number of arguments, and if the way it does
3599 that is different from the way we would like it (i.e. varargs vs.
3600 stdarg) then issue a warning and leave the header unconverted. */
3602 if (other_variable_style_function (def_dec_p->ansi_decl))
3605 fprintf (stderr, "%s: %d: warning: definition of %s not converted\n",
3606 shortpath (NULL, def_dec_p->file->hash_entry->symbol),
3607 identify_lineno (end_formals),
3609 output_up_to (end_formals);
/* A nonzero result from edit_formals_lists is treated as failure: the
output pointers are restored and the definition is reported as not
converted. */
3613 if (edit_formals_lists (end_formals, def_dec_p->f_list_count, def_dec_p))
3615 restore_pointers ();
3616 fprintf (stderr, "%s: definition of function `%s' not converted\n",
3617 pname, function_to_edit);
3621 /* Have to output the last right paren because this never gets flushed by
3622 edit_formals_lists. */
3624 output_up_to (end_formals);
3629 const char *semicolon_p;
3630 const char *limit_p;
3632 int had_newlines = 0;
3634 /* Now write out the K&R style formal declarations, one per line. */
/* Each declaration in formal_decls runs up to and including a ';'. The
loop resumes two bytes past that semicolon, presumably skipping a single
separator character -- TODO confirm the formal_decls layout. */
3636 decl_p = def_dec_p->formal_decls;
3637 limit_p = decl_p + strlen (decl_p);
3638 for (;decl_p < limit_p; decl_p = semicolon_p + 2)
3640 for (semicolon_p = decl_p; *semicolon_p != ';'; semicolon_p++)
3642 output_string ("\n");
3643 output_string (indent_string);
3644 output_bytes (decl_p, (size_t) ((semicolon_p + 1) - decl_p));
3647 /* If there are no newlines between the end of the formals list and the
3648 start of the body, we should insert one now. */
3650 for (scan_p = end_formals+1; *scan_p != '{'; )
3652 if (*scan_p == '\n')
3657 check_source (++scan_p < clean_text_limit, 0);
3660 output_string ("\n");
3662 #else /* !defined (UNPROTOIZE) */
3663 /* If we are protoizing, there may be some flotsam & jetsam (like comments
3664 and preprocessing directives) after the old formals list but before
3665 the following { and we would like to preserve that stuff while effectively
3666 deleting the existing K&R formal parameter declarations. We do so here
3667 in a rather tricky way. Basically, we white out any stuff *except*
3668 the comments/pp-directives in the original text buffer, then, if there
3669 is anything in this area *other* than whitespace, we output it. */
3671 const char *end_formals_orig;
3672 const char *start_body;
3673 const char *start_body_orig;
3675 const char *scan_orig;
3676 int have_flotsum = 0;
3677 int have_newlines = 0;
3679 for (start_body = end_formals + 1; *start_body != '{';)
3680 check_source (++start_body < clean_text_limit, 0);
/* Translate the clean-buffer positions into the same byte offsets within
the original text buffer, then walk both buffers in step. */
3682 end_formals_orig = orig_text_base + (end_formals - clean_text_base);
3683 start_body_orig = orig_text_base + (start_body - clean_text_base);
3684 scan = end_formals + 1;
3685 scan_orig = end_formals_orig + 1;
3686 for (; scan < start_body; scan++, scan_orig++)
/* Bytes that are the same in both buffers were not blanked by the
cleaning pass, so they are not comment or directive text. */
3688 if (*scan == *scan_orig)
3690 have_newlines |= (*scan_orig == '\n');
3691 /* Leave identical whitespace alone. */
3692 if (!isspace (*scan_orig))
3693 *((NONCONST char *)scan_orig) = ' '; /* identical - so whiteout */
3699 output_bytes (end_formals_orig + 1,
3700 (size_t) (start_body_orig - end_formals_orig) - 1);
3703 output_string ("\n");
3705 output_string (" ");
/* Everything before the opening brace of the body is now accounted for. */
3706 clean_read_ptr = start_body - 1;
3708 #endif /* !defined (UNPROTOIZE) */
3711 /* Clean up the clean text buffer. Do this by converting comments and
3712 preprocessor directives into spaces. Also convert line continuations
3713 into whitespace. Also, whiteout string and character literals.
The range processed runs from NEW_CLEAN_TEXT_BASE up to, but not
including, NEW_CLEAN_TEXT_LIMIT. */
3716 do_cleaning (new_clean_text_base, new_clean_text_limit)
3717 char *new_clean_text_base;
3718 char *new_clean_text_limit;
/* Set once any non-whitespace character has been seen on the current
line and cleared again at each newline; the '#' case consults it before
scanning a directive. */
3721 int non_whitespace_since_newline = 0;
3723 for (scan_p = new_clean_text_base; scan_p < new_clean_text_limit; scan_p++)
3727 case '/': /* Handle comments. */
/* A slash that is not followed by a star is ordinary token text. */
3728 if (scan_p[1] != '*')
3730 non_whitespace_since_newline = 1;
/* Advance until scan_p sits on the star of the closing star-slash pair.
Every inner scan in this function also tests scan_p against
new_clean_text_limit so that an unterminated construct cannot run off
the end of the buffer. */
3734 while (scan_p[1] != '/' || scan_p[0] != '*')
3736 if (!isspace (*scan_p))
3738 if (++scan_p >= new_clean_text_limit)
3745 case '#': /* Handle pp directives. */
3746 if (non_whitespace_since_newline)
/* The directive extends to the first newline that is not preceded by a
backslash. */
3749 while (scan_p[1] != '\n' || scan_p[0] == '\\')
3751 if (!isspace (*scan_p))
3753 if (++scan_p >= new_clean_text_limit)
3759 case '\'': /* Handle character literals. */
3760 non_whitespace_since_newline = 1;
/* Stop just before the closing quote; a quote preceded by a backslash
does not end the literal. */
3761 while (scan_p[1] != '\'' || scan_p[0] == '\\')
3763 if (scan_p[0] == '\\' && !isspace (scan_p[1]))
3765 if (!isspace (*scan_p))
3767 if (++scan_p >= new_clean_text_limit)
3773 case '"': /* Handle string literals. */
3774 non_whitespace_since_newline = 1;
/* Same scan as for character literals, with the double quote as the
terminator. */
3775 while (scan_p[1] != '"' || scan_p[0] == '\\')
3777 if (scan_p[0] == '\\' && !isspace (scan_p[1]))
3779 if (!isspace (*scan_p))
3781 if (++scan_p >= new_clean_text_limit)
3787 case '\\': /* Handle line continuations. */
3788 if (scan_p[1] != '\n')
3794 non_whitespace_since_newline = 0; /* Reset. */
3803 break; /* Whitespace characters. */
3807 non_whitespace_since_newline = 1;
3813 /* Given a pointer to the closing right parenthesis for a particular formals
3814 list (in the clean text buffer) find the corresponding left parenthesis
3815 and return a pointer to it. */
3818 careful_find_l_paren (p)
/* Scan leftwards from the byte before P, starting at a nesting depth of
one and continuing until the depth falls to zero. The check_source call
in the loop step rejects the source if the scan would move in front of
clean_text_base. */
3824 for (paren_depth = 1, q = p-1; paren_depth; check_source (--q >= clean_text_base, 0))
3839 /* Scan the clean text buffer for cases of function definitions that we
3840 don't really know about because they were preprocessed out when the
3841 aux info files were created.
3843 In this version of protoize/unprotoize we just give a warning for each
3844 one found. A later version may be able to at least unprotoize such
3847 Note that we may easily find all function definitions simply by
3848 looking for places where there is a right paren which is (ignoring
3849 whitespace) immediately followed by either a left-brace or by an
3850 upper or lower case letter. Whenever we find this combination, we
3851 have also found a function definition header.
3853 Finding function *declarations* using syntactic clues is much harder.
3854 I will probably try to do this in a later version though.
FILE_P identifies the file being scanned; its name is used in the
messages and its defs_decs chain is searched for definitions that are
already known. */
3857 scan_for_missed_items (file_p)
3858 const file_info *file_p;
/* NOTE(review): scan_p, backup_limit and last_r_paren are static,
presumably so that their values are still defined after a longjmp back
to the setjmp below -- confirm. */
3860 static const char *scan_p;
/* The forward scan stops three bytes short of the end of the buffer. */
3861 const char *limit = clean_text_limit - 3;
3862 static const char *backup_limit;
3864 backup_limit = clean_text_base - 1;
3866 for (scan_p = clean_text_base; scan_p < limit; scan_p++)
3870 static const char *last_r_paren;
3871 const char *ahead_p;
3873 last_r_paren = scan_p;
/* Look past any whitespace following the paren. */
3875 for (ahead_p = scan_p + 1; isspace (*ahead_p); )
3876 check_source (++ahead_p < limit, limit);
3878 scan_p = ahead_p - 1;
3880 if (isalpha (*ahead_p) || *ahead_p == '{')
3882 const char *last_l_paren;
3883 const int lineno = identify_lineno (ahead_p);
3885 if (setjmp (source_confusion_recovery))
3888 /* We know we have a function definition header. Now skip
3889 leftwards over all of its associated formals lists. */
3893 last_l_paren = careful_find_l_paren (last_r_paren);
3894 for (last_r_paren = last_l_paren-1; isspace (*last_r_paren); )
3895 check_source (--last_r_paren >= backup_limit, backup_limit);
3897 while (*last_r_paren == ')');
/* After the formals lists have been skipped, an identifier character
here is the last character of the candidate function name. */
3899 if (is_id_char (*last_r_paren))
3901 const char *id_limit = last_r_paren + 1;
3902 const char *id_start;
3904 const def_dec_info *dd_p;
3906 for (id_start = id_limit-1; is_id_char (*id_start); )
3907 check_source (--id_start >= backup_limit, backup_limit);
/* Later backward scans are not allowed to go left of this identifier. */
3909 backup_limit = id_start;
3910 if ((id_length = (size_t) (id_limit - id_start)) == 0)
3914 char *func_name = (char *) alloca (id_length + 1);
3915 static const char * const stmt_keywords[]
3916 = { "if", "while", "for", "switch", "return", 0 };
3917 const char * const *stmt_keyword;
/* strncpy does not terminate the copy here, so the NUL is stored
explicitly. */
3919 strncpy (func_name, id_start, id_length);
3920 func_name[id_length] = '\0';
3922 /* We must check here to see if we are actually looking at
3923 a statement rather than an actual function definition header. */
3925 for (stmt_keyword = stmt_keywords; *stmt_keyword; stmt_keyword++)
3926 if (!strcmp (func_name, *stmt_keyword))
3930 fprintf (stderr, "%s: found definition of `%s' at %s(%d)\n",
3933 shortpath (NULL, file_p->hash_entry->symbol),
3934 identify_lineno (id_start));
3936 /* We really should check for a match of the function name
3937 here also, but why bother. */
3939 for (dd_p = file_p->defs_decs; dd_p; dd_p = dd_p->next_in_file)
3940 if (dd_p->is_func_def && dd_p->line == lineno)
3943 /* If we make it here, then we did not know about this
3944 function definition. */
3946 fprintf (stderr, "%s: %d: warning: `%s' was #if 0\n",
3947 shortpath (NULL, file_p->hash_entry->symbol),
3948 identify_lineno (id_start), func_name);
3949 fprintf (stderr, "%s: function definition not converted\n",
3959 /* Do all editing operations for a single source file (either a "base" file
3960 or an "include" file). To do this we read the file into memory, keep a
3961 virgin copy there, make another cleaned in-core copy of the original file
3962 (i.e. one in which all of the comments and preprocessor directives have
3963 been replaced with whitespace), then use these two in-core copies of the
3964 file to make a new edited in-core copy of the file. Finally, rename the
3965 original file (as a way of saving it), and then write the edited version
3966 of the file from core to a disk file of the same name as the original.
3968 Note that the trick of making a copy of the original sans comments &
3969 preprocessor directives makes the editing a whole lot easier.
HP is the hash table entry for the file; its fip member gives the
file_info record that drives the edits. */
3973 const hash_table_entry *hp;
3975 struct stat stat_buf;
3976 const file_info *file_p = hp->fip;
3977 char *new_orig_text_base;
3978 char *new_orig_text_limit;
3979 char *new_clean_text_base;
3980 char *new_clean_text_limit;
3983 int first_definition_in_file;
3985 /* If we are not supposed to be converting this file, or if there is
3986 nothing in there which needs converting, just skip this file. */
3988 if (!needs_to_be_converted (file_p))
3991 convert_filename = file_p->hash_entry->symbol;
3993 /* Convert a file if it is in a directory where we want conversion
3994 and the file is not excluded. */
3996 if (!directory_specified_p (convert_filename)
3997 || file_excluded_p (convert_filename))
4001 /* Don't even mention "system" include files unless we are
4002 protoizing. If we are protoizing, we mention these as a
4003 gentle way of prodding the user to convert his "system"
4004 include files to prototype format. */
4005 && !in_system_include_dir (convert_filename)
4006 #endif /* defined (UNPROTOIZE) */
4008 fprintf (stderr, "%s: file `%s' not converted\n",
4009 pname, shortpath (NULL, convert_filename));
4013 /* Let the user know what we are up to. */
4016 fprintf (stderr, "%s: would convert file `%s'\n",
4017 pname, shortpath (NULL, convert_filename));
4019 fprintf (stderr, "%s: converting file `%s'\n",
4020 pname, shortpath (NULL, convert_filename));
4023 /* Find out the size (in bytes) of the original file. */
4025 /* The cast avoids an erroneous warning on AIX. */
4026 if (my_stat ((char *)convert_filename, &stat_buf) == -1)
4028 fprintf (stderr, "%s: error: can't get status for file `%s': %s\n",
4029 pname, shortpath (NULL, convert_filename), sys_errlist[errno]);
4032 orig_size = stat_buf.st_size;
4034 /* Allocate a buffer to hold the original text. */
/* Both text buffers get two bytes beyond the file size; the text is later
made to end with a newline followed by a null. */
4036 orig_text_base = new_orig_text_base = (char *) xmalloc (orig_size + 2);
4037 orig_text_limit = new_orig_text_limit = new_orig_text_base + orig_size;
4039 /* Allocate a buffer to hold the cleaned-up version of the original text. */
4041 clean_text_base = new_clean_text_base = (char *) xmalloc (orig_size + 2);
4042 clean_text_limit = new_clean_text_limit = new_clean_text_base + orig_size;
/* The read and write pointers start one byte before their buffers. */
4043 clean_read_ptr = clean_text_base - 1;
4045 /* Allocate a buffer that will hopefully be large enough to hold the entire
4046 converted output text. As an initial guess for the maximum size of the
4047 output buffer, use 125% of the size of the original + some extra. This
4048 buffer can be expanded later as needed. */
4050 repl_size = orig_size + (orig_size >> 2) + 4096;
4051 repl_text_base = (char *) xmalloc (repl_size + 2);
4052 repl_text_limit = repl_text_base + repl_size - 1;
4053 repl_write_ptr = repl_text_base - 1;
4058 /* Open the file to be converted in READ ONLY mode. */
4060 if ((input_file = my_open (convert_filename, O_RDONLY, 0444)) == -1)
4062 fprintf (stderr, "%s: error: can't open file `%s' for reading: %s\n",
4063 pname, shortpath (NULL, convert_filename),
4064 sys_errlist[errno]);
4068 /* Read the entire original source text file into the original text buffer
4069 in one swell fwoop. Then figure out where the end of the text is and
4070 make sure that it ends with a newline followed by a null. */
4072 if (read (input_file, new_orig_text_base, orig_size) != orig_size)
4075 fprintf (stderr, "\n%s: error: while reading input file `%s': %s\n",
4076 pname, shortpath (NULL, convert_filename),
4077 sys_errlist[errno]);
/* Supply a final newline if the file is empty or lacks one. */
4084 if (orig_size == 0 || orig_text_limit[-1] != '\n')
4086 *new_orig_text_limit++ = '\n';
4090 /* Create the cleaned up copy of the original text. */
/* NOTE(review): new_clean_text_limit was computed from orig_size before the
optional newline was appended above and is not visibly advanced here --
confirm that the appended byte is meant to lie outside the cleaned range. */
4092 memcpy (new_clean_text_base, orig_text_base,
4093 (size_t) (orig_text_limit - orig_text_base));
4094 do_cleaning (new_clean_text_base, new_clean_text_limit);
4099 size_t clean_size = orig_text_limit - orig_text_base;
/* Room for the file name plus the six characters of ".clean" plus the
terminating null. */
4100 char *const clean_filename = (char *) alloca (strlen (convert_filename) + 6 + 1);
4102 /* Open (and create) the clean file. */
4104 strcpy (clean_filename, convert_filename);
4105 strcat (clean_filename, ".clean");
4106 if ((clean_file = creat (clean_filename, 0666)) == -1)
4108 fprintf (stderr, "%s: error: can't create/open clean file `%s': %s\n",
4109 pname, shortpath (NULL, clean_filename),
4110 sys_errlist[errno]);
4114 /* Write the clean file. */
4116 if (write (clean_file, new_clean_text_base, clean_size) != clean_size)
4117 fprintf (stderr, "%s: error: while writing file `%s': %s\n",
4118 pname, shortpath (NULL, clean_filename), sys_errlist[errno]);
4124 /* Do a simplified scan of the input looking for things that were not
4125 mentioned in the aux info files because of the fact that they were
4126 in a region of the source which was preprocessed-out (via #if or
4129 scan_for_missed_items (file_p);
4131 /* Setup to do line-oriented forward seeking in the clean text buffer. */
4133 last_known_line_number = 1;
4134 last_known_line_start = clean_text_base;
4136 /* Now get down to business and make all of the necessary edits. */
4139 const def_dec_info *def_dec_p;
4141 first_definition_in_file = 1;
4142 def_dec_p = file_p->defs_decs;
4143 for (; def_dec_p; def_dec_p = def_dec_p->next_in_file)
4145 const char *clean_text_p = seek_to_line (def_dec_p->line);
4147 /* clean_text_p now points to the first character of the line which
4148 contains the `terminator' for the declaration or definition that
4149 we are about to process. */
/* Global declarations are added once per file, just ahead of the first
function definition encountered. */
4153 if (global_flag && def_dec_p->is_func_def && first_definition_in_file)
4155 add_global_decls (def_dec_p->file, clean_text_p);
4156 first_definition_in_file = 0;
4159 /* Don't edit this item if it is already in prototype format or if it
4160 is a function declaration and we have found no corresponding
4163 if (def_dec_p->prototyped
4164 || (!def_dec_p->is_func_def && !def_dec_p->definition))
4167 #endif /* !defined (UNPROTOIZE) */
4169 if (def_dec_p->is_func_def)
4170 edit_fn_definition (def_dec_p, clean_text_p);
4173 if (def_dec_p->is_implicit)
4174 add_local_decl (def_dec_p, clean_text_p);
4176 #endif /* !defined (UNPROTOIZE) */
4177 edit_fn_declaration (def_dec_p, clean_text_p);
4181 /* Finalize things. Output the last trailing part of the original text. */
4183 output_up_to (clean_text_limit - 1);
4185 /* If this is just a test run, stop now and just deallocate the buffers. */
4189 free (new_orig_text_base);
4190 free (new_clean_text_base);
4191 free (repl_text_base);
4195 /* Change the name of the original input file. This is just a quick way of
4196 saving the original file. */
4200 char *new_filename =
4201 (char *) xmalloc (strlen (convert_filename) + strlen (save_suffix) + 2);
4203 strcpy (new_filename, convert_filename);
4204 strcat (new_filename, save_suffix);
/* The original is saved by linking it under the new name; an EEXIST
failure is reported as a warning that a saved copy already exists. */
4205 if (my_link (convert_filename, new_filename) == -1)
4207 if (errno == EEXIST)
4210 fprintf (stderr, "%s: warning: file `%s' already saved in `%s'\n",
4212 shortpath (NULL, convert_filename),
4213 shortpath (NULL, new_filename));
4217 fprintf (stderr, "%s: error: can't link file `%s' to `%s': %s\n",
4219 shortpath (NULL, convert_filename),
4220 shortpath (NULL, new_filename),
4221 sys_errlist[errno]);
4227 if (my_unlink (convert_filename) == -1)
4229 fprintf (stderr, "%s: error: can't delete file `%s': %s\n",
4230 pname, shortpath (NULL, convert_filename), sys_errlist[errno]);
4237 /* Open (and create) the output file. */
4239 if ((output_file = creat (convert_filename, 0666)) == -1)
4241 fprintf (stderr, "%s: error: can't create/open output file `%s': %s\n",
4242 pname, shortpath (NULL, convert_filename),
4243 sys_errlist[errno]);
4247 /* Write the output file. */
/* repl_write_ptr addresses the last byte written, so the byte count is
one more than its offset from the base. */
4250 unsigned int out_size = (repl_write_ptr + 1) - repl_text_base;
4252 if (write (output_file, repl_text_base, out_size) != out_size)
4253 fprintf (stderr, "%s: error: while writing file `%s': %s\n",
4254 pname, shortpath (NULL, convert_filename),
4255 sys_errlist[errno]);
4258 close (output_file);
4261 /* Deallocate the conversion buffers. */
4263 free (new_orig_text_base);
4264 free (new_clean_text_base);
4265 free (repl_text_base);
4267 /* Change the mode of the output file to match the original file. */
4269 /* The cast avoids an erroneous warning on AIX. */
4270 if (my_chmod ((char *)convert_filename, stat_buf.st_mode) == -1)
4271 fprintf (stderr, "%s: error: can't change mode of file `%s': %s\n",
4272 pname, shortpath (NULL, convert_filename), sys_errlist[errno]);
4274 /* Note: We would try to change the owner and group of the output file
4275 to match those of the input file here, except that may not be a good
4276 thing to do because it might be misleading. Also, it might not even
4277 be possible to do that (on BSD systems with quotas for instance). */
4280 /* Do all of the individual steps needed to do the protoization (or
4281 unprotoization) of the files referenced in the aux_info files given
4282 in the command line. */
4287 const char * const *base_pp;
/* One past the last entry of base_source_filenames. */
4288 const char * const * const end_pps
4289 = &base_source_filenames[n_base_source_files];
4293 #endif /* !defined (UNPROTOIZE) */
4295 /* One-by-one, check (and create if necessary), open, and read all of the
4296 stuff in each aux_info file. After reading each aux_info file, the
4297 aux_info_file just read will be automatically deleted unless the
4298 keep_flag is set. */
4300 for (base_pp = base_source_filenames; base_pp < end_pps; base_pp++)
4301 process_aux_info_file (*base_pp, keep_flag, 0);
4305 /* Also open and read the special SYSCALLS.c aux_info file which gives us
4306 the prototypes for all of the standard system-supplied functions. */
/* NOTE(review): presumably syscalls_filename is a char array, so that
sizeof covers its terminating null and the extra byte leaves room for
the '/' that may be appended below -- confirm its declaration. */
4308 if (nondefault_syscalls_dir)
4310 syscalls_absolute_filename
4311 = (char *) xmalloc (strlen (nondefault_syscalls_dir)
4312 + sizeof (syscalls_filename) + 1);
4313 strcpy (syscalls_absolute_filename, nondefault_syscalls_dir);
4317 syscalls_absolute_filename
4318 = (char *) xmalloc (strlen (default_syscalls_dir)
4319 + sizeof (syscalls_filename) + 1);
4320 strcpy (syscalls_absolute_filename, default_syscalls_dir);
/* Make sure the directory part ends in a slash before the file name is
appended. */
4323 syscalls_len = strlen (syscalls_absolute_filename);
4324 if (*(syscalls_absolute_filename + syscalls_len - 1) != '/')
4326 *(syscalls_absolute_filename + syscalls_len++) = '/';
4327 *(syscalls_absolute_filename + syscalls_len) = '\0';
4329 strcat (syscalls_absolute_filename, syscalls_filename);
4331 /* Call process_aux_info_file in such a way that it does not try to
4332 delete the SYSCALLS aux_info file. */
4334 process_aux_info_file (syscalls_absolute_filename, 1, 1);
4336 #endif /* !defined (UNPROTOIZE) */
4338 /* When we first read in all of the information from the aux_info files
4339 we saved it in descending line number order, because that was likely to
4340 be faster. Now however, we want the chains of def & dec records to
4341 appear in ascending line number order as we get further away from the
4342 file_info record that they hang from. The following line causes all of
4343 these lists to be rearranged into ascending line number order. */
4345 visit_each_hash_node (filename_primary, reverse_def_dec_list);
4349 /* Now do the "real" work. The following line causes each declaration record
4350 to be "visited". For each of these nodes, an attempt is made to match
4351 up the function declaration with a corresponding function definition,
4352 which should have a full prototype-format formals list with it. Once
4353 these match-ups are made, the conversion of the function declarations
4354 to prototype format can be made. */
4356 visit_each_hash_node (function_name_primary, connect_defs_and_decs);
4358 #endif /* !defined (UNPROTOIZE) */
4360 /* Now convert each file that can be converted (and needs to be). */
4362 visit_each_hash_node (filename_primary, edit_file);
4366 /* If we are working in cplusplus mode, try to rename all .c files to .C
4367 files. Don't panic if some of the renames don't work. */
4369 if (cplusplus_flag && !nochange_flag)
4370 visit_each_hash_node (filename_primary, rename_c_file);
4372 #endif /* !defined (UNPROTOIZE) */
/* Long-option table passed to getopt_long. Each entry is
{name, has_arg, flag, val}. The flag member is 0 in every entry, so
getopt_long returns val, which is the equivalent short-option letter.
has_arg must agree with the short-option string given to getopt_long:
a letter followed by ':' there takes an argument. "file_name" maps to
'p', which that string declares as `p:', so it is marked as taking an
argument; with has_arg 0 the long form would leave optarg null. */
4375 static struct option longopts[] =
4377 {"version", 0, 0, 'V'},
4378 {"file_name", 1, 0, 'p'},
4379 {"quiet", 0, 0, 'q'},
4380 {"silent", 0, 0, 'q'},
4381 {"force", 0, 0, 'f'},
4382 {"keep", 0, 0, 'k'},
4383 {"nosave", 0, 0, 'N'},
4384 {"nochange", 0, 0, 'n'},
4385 {"compiler-options", 1, 0, 'c'},
4386 {"exclude", 1, 0, 'x'},
4387 {"directory", 1, 0, 'd'},
4389 {"indent", 1, 0, 'i'},
4391 {"local", 0, 0, 'l'},
4392 {"global", 0, 0, 'g'},
4394 {"syscalls-dir", 1, 0, 'B'},
4408 pname = strrchr (argv[0], '/');
4409 pname = pname ? pname+1 : argv[0];
4411 /* Read the working directory, avoiding arbitrary limit. */
4412 size = GUESSPATHLEN;
4417 cwd_buffer = (char *) xmalloc (size);
4418 value = getcwd (cwd_buffer, size);
4419 if (value != 0 || errno != ERANGE)
4425 /* By default, convert the files in the current directory. */
4426 directory_list = string_list_cons (cwd_buffer, NULL);
4428 while ((c = getopt_long (argc, argv,
4432 "B:c:Cd:gklnNp:qVx:",
4434 longopts, &longind)) != EOF)
4436 if (c == 0) /* Long option. */
4437 c = longopts[longind].val;
4441 compiler_file_name = optarg;
4445 = string_list_cons (abspath (NULL, optarg), directory_list);
4448 exclude_list = string_list_cons (optarg, exclude_list);
4473 munge_compile_params (optarg);
4477 indent_string = optarg;
4479 #else /* !defined (UNPROTOIZE) */
4490 nondefault_syscalls_dir = optarg;
4492 #endif /* !defined (UNPROTOIZE) */
4498 n_base_source_files = argc - optind;
4500 /* Now actually make a list of the base source filenames. */
4502 base_source_filenames =
4503 (const char **) xmalloc ((n_base_source_files + 1) * sizeof (char *));
4504 n_base_source_files = 0;
4505 for (; optind < argc; optind++)
4507 const char *path = abspath (NULL, argv[optind]);
4508 int len = strlen (path);
4510 if (path[len-1] == 'c' && path[len-2] == '.')
4511 base_source_filenames[n_base_source_files++] = path;
4514 fprintf (stderr, "%s: input file names must have .c suffixes: %s\n",
4515 pname, shortpath (NULL, path));
4521 /* We are only interested in the very first identifier token in the
4522 definition of `va_list', so if there is more junk after that first
4523 identifier token, delete it from the `varargs_style_indicator'. */
4527 for (cp = varargs_style_indicator; isalnum (*cp) || *cp == '_'; cp++)
4530 varargs_style_indicator = savestring (varargs_style_indicator,
4531 cp - varargs_style_indicator);
4533 #endif /* !defined (UNPROTOIZE) */
4540 fprintf (stderr, "%s: %s\n", pname, version_string);