xref: /linux-6.15/scripts/basic/fixdep.c (revision bc6df812)
1 /*
2  * "Optimize" a list of dependencies as spit out by gcc -MD
3  * for the kernel build
4  * ===========================================================================
5  *
6  * Author       Kai Germaschewski
7  * Copyright    2002 by Kai Germaschewski  <[email protected]>
8  *
9  * This software may be used and distributed according to the terms
10  * of the GNU General Public License, incorporated herein by reference.
11  *
12  *
13  * Introduction:
14  *
15  * gcc produces a very nice and correct list of dependencies which
16  * tells make when to remake a file.
17  *
18  * To use this list as-is however has the drawback that virtually
19  * every file in the kernel includes autoconf.h.
20  *
21  * If the user re-runs make *config, autoconf.h will be
22  * regenerated.  make notices that and will rebuild every file which
23  * includes autoconf.h, i.e. basically all files. This is extremely
24  * annoying if the user just changed CONFIG_HIS_DRIVER from n to m.
25  *
26  * So we play the same trick that "mkdep" played before. We replace
27  * the dependency on autoconf.h by a dependency on every config
28  * option which is mentioned in any of the listed prerequisites.
29  *
30  * kconfig populates a tree in include/config/ with an empty file
31  * for each config symbol and when the configuration is updated
32  * the files representing changed config options are touched
33  * which then let make pick up the changes and the files that use
34  * the config symbols are rebuilt.
35  *
36  * So if the user changes his CONFIG_HIS_DRIVER option, only the objects
37  * which depend on "include/config/HIS_DRIVER" will be rebuilt,
38  * so most likely only his driver ;-)
39  *
40  * The idea above dates, by the way, back to Michael E Chastain, AFAIK.
41  *
42  * So to get dependencies right, there are two issues:
43  * o if any of the files the compiler read changed, we need to rebuild
44  * o if the command line given to compile the file changed, we
45  *   better rebuild as well.
46  *
47  * The former is handled by using the -MD output, the latter by saving
48  * the command line used to compile the old object and comparing it
49  * to the one we would now use.
50  *
51  * Again, also this idea is pretty old and has been discussed on
52  * kbuild-devel a long time ago. I don't have a sensibly working
53  * internet connection right now, so I rather don't mention names
54  * without double checking.
55  *
56  * This code here has been partially based on mkdep.c, which
57  * says the following about its history:
58  *
59  *   Copyright abandoned, Michael Chastain, <mailto:[email protected]>.
60  *   This is a C version of syncdep.pl by Werner Almesberger.
61  *
62  *
63  * It is invoked as
64  *
65  *   fixdep <depfile> <target> <cmdline>
66  *
67  * and will read the dependency file <depfile>
68  *
69  * The transformed dependency snippet is written to stdout.
70  *
71  * It first generates a line
72  *
73  *   savedcmd_<target> = <cmdline>
74  *
75  * and then basically copies the .<target>.d file to stdout, in the
76  * process filtering out the dependency on autoconf.h and adding
77  * dependencies on include/config/MY_OPTION for every
78  * CONFIG_MY_OPTION encountered in any of the prerequisites.
79  *
80  * We don't even try to really parse the header files, but
81  * merely grep, i.e. if CONFIG_FOO is mentioned in a comment, it will
82  * be picked up as well. It's not a problem with respect to
83  * correctness, since that can only give too many dependencies, thus
84  * we cannot miss a rebuild. Since people tend to not mention totally
85  * unrelated CONFIG_ options all over the place, it's not an
86  * efficiency problem either.
87  *
88  * (Note: it'd be easy to port over the complete mkdep state machine,
89  *  but I don't think the added complexity is worth it)
90  */
91 
92 #include <sys/types.h>
93 #include <sys/stat.h>
94 #include <unistd.h>
95 #include <fcntl.h>
96 #include <string.h>
97 #include <stdbool.h>
98 #include <stdlib.h>
99 #include <stdio.h>
100 #include <ctype.h>
101 
/* Print the command-line synopsis to stderr and terminate with status 1. */
static void usage(void)
{
	fputs("Usage: fixdep <depfile> <target> <cmdline>\n", stderr);
	exit(1);
}
107 
/*
 * One remembered name in the hash table of already-seen config symbols.
 * Entries that fall into the same bucket are chained through ->next.
 */
struct item {
	struct item	*next;	/* next entry in the same bucket, or NULL */
	unsigned int	len;	/* number of bytes stored in name[] */
	unsigned int	hash;	/* full hash of name[], cached for fast compare */
	char		name[];	/* the name itself; len bytes, no terminator */
};

/* Number of buckets; a hash is reduced to a bucket index with "% HASHSZ". */
#define HASHSZ 256

/* Bucket heads of the chained hash table; all start out NULL. */
static struct item *hashtab[HASHSZ];
117 
/*
 * Hash the first sz bytes of str with a 32-bit FNV-style function:
 * starting from the offset basis, each byte is xor-ed in and the
 * result is multiplied by the FNV prime.
 */
static unsigned int strhash(const char *str, unsigned int sz)
{
	const char *end = str + sz;
	unsigned int hash = 2166136261U;

	while (str < end) {
		hash ^= *str++;
		hash *= 0x01000193;
	}

	return hash;
}
127 
128 /*
129  * Lookup a value in the configuration string.
130  */
131 static int is_defined_config(const char *name, int len, unsigned int hash)
132 {
133 	struct item *aux;
134 
135 	for (aux = hashtab[hash % HASHSZ]; aux; aux = aux->next) {
136 		if (aux->hash == hash && aux->len == len &&
137 		    memcmp(aux->name, name, len) == 0)
138 			return 1;
139 	}
140 	return 0;
141 }
142 
143 /*
144  * Add a new value to the configuration string.
145  */
146 static void define_config(const char *name, int len, unsigned int hash)
147 {
148 	struct item *aux = malloc(sizeof(*aux) + len);
149 
150 	if (!aux) {
151 		perror("fixdep:malloc");
152 		exit(1);
153 	}
154 	memcpy(aux->name, name, len);
155 	aux->len = len;
156 	aux->hash = hash;
157 	aux->next = hashtab[hash % HASHSZ];
158 	hashtab[hash % HASHSZ] = aux;
159 }
160 
/*
 * Note that a config symbol is referenced.
 *
 * m points at the symbol name (without the CONFIG_ prefix) and slen is
 * its length. The first time a given name is seen it is remembered and a
 * "$(wildcard include/config/<name>)" dependency line is written to
 * stdout; repeated names produce no output.
 */
static void use_config(const char *m, int slen)
{
	const unsigned int hash = strhash(m, slen);

	if (!is_defined_config(m, slen, hash)) {
		define_config(m, slen, hash);
		/* Print out a dependency path from a symbol name. */
		printf("    $(wildcard include/config/%.*s) \\\n", slen, m);
	}
}
175 
/*
 * Test whether the slen bytes at s end with the NUL-terminated string sub.
 * Returns 1 on a match and 0 otherwise; an empty sub always matches.
 */
static int str_ends_with(const char *s, int slen, const char *sub)
{
	const int sublen = strlen(sub);
	const char *tail;

	/* the suffix cannot be longer than the string itself */
	if (slen < sublen)
		return 0;

	tail = s + (slen - sublen);
	return memcmp(tail, sub, sublen) == 0;
}
186 
/* Return nonzero if c is alphanumeric or an underscore. */
static int is_symbol_char(char c)
{
	/*
	 * The <ctype.h> functions are only defined for EOF and values
	 * representable as unsigned char; a plain char holding a byte
	 * >= 0x80 may be negative, so convert before calling isalnum().
	 */
	return isalnum((unsigned char)c) || c == '_';
}

/*
 * Scan a NUL-terminated buffer for CONFIG_* words and report each one
 * through use_config().
 *
 * A match only counts when "CONFIG_" is not preceded by an alphanumeric
 * character or underscore (so e.g. "FOO_CONFIG_BAR" is skipped). The
 * symbol name is the run of alphanumerics/underscores that follows the
 * prefix; a trailing "_MODULE" is stripped from it, and names that end
 * up empty are ignored.
 */
static void parse_config_file(const char *p)
{
	const char *q, *r;
	const char *start = p;

	while ((p = strstr(p, "CONFIG_"))) {
		/* "CONFIG_" in the middle of a longer identifier: skip it */
		if (p > start && is_symbol_char(p[-1])) {
			p += 7;
			continue;
		}
		p += 7;

		/* q ends up one past the last character of the symbol */
		q = p;
		while (is_symbol_char(*q))
			q++;

		/* r marks the end of the name with any "_MODULE" removed */
		if (str_ends_with(p, q - p, "_MODULE"))
			r = q - 7;
		else
			r = q;
		if (r > p)
			use_config(p, r - p);

		/* resume searching after the word just handled */
		p = q;
	}
}
210 
/*
 * Read a whole file into a freshly allocated, NUL-terminated buffer.
 *
 * The buffer size is taken from fstat(); the caller owns the returned
 * buffer and releases it with free(). Any failure (open, fstat, malloc,
 * read error, or the file ending before the size reported by fstat) is
 * reported on stderr and terminates the program with status 2, so this
 * function never returns NULL.
 */
static void *read_file(const char *filename)
{
	struct stat st;
	int fd;
	char *buf;
	size_t size, done = 0;

	fd = open(filename, O_RDONLY);
	if (fd < 0) {
		fprintf(stderr, "fixdep: error opening file: ");
		perror(filename);
		exit(2);
	}
	if (fstat(fd, &st) < 0) {
		fprintf(stderr, "fixdep: error fstat'ing file: ");
		perror(filename);
		exit(2);
	}
	size = st.st_size;
	buf = malloc(size + 1);
	if (!buf) {
		perror("fixdep: malloc");
		exit(2);
	}

	/*
	 * read() is allowed to return fewer bytes than requested, so keep
	 * reading until the whole file has been collected.
	 */
	while (done < size) {
		ssize_t n = read(fd, buf + done, size - done);

		if (n < 0) {
			perror("fixdep: read");
			exit(2);
		}
		if (n == 0) {
			/* errno is meaningless here, so do not use perror() */
			fprintf(stderr, "fixdep: unexpected end of file: %s\n",
				filename);
			exit(2);
		}
		done += n;
	}
	buf[size] = '\0';
	close(fd);

	return buf;
}
242 
/*
 * Decide whether a dependency is to be left out of the output.
 *
 * s/len describe the dependency path. Returns 1 when the path ends in
 * one of the generated headers listed below, 0 otherwise.
 */
static int is_ignored_file(const char *s, int len)
{
	if (str_ends_with(s, len, "include/generated/autoconf.h"))
		return 1;
	if (str_ends_with(s, len, "include/generated/autoksyms.h"))
		return 1;

	return 0;
}
249 
/*
 * Translate the contents of a dependency file into the output format.
 *
 * p is the NUL-terminated, writable text of the dependency file; it is
 * modified in place while parsing (tokens are temporarily terminated and
 * escape backslashes in front of '#' and ':' are squeezed out). target
 * is the name used in the emitted variable names.
 *
 * Written to stdout:
 *   source_<target> := <first prerequisite after the first colon>
 *   deps_<target> := \
 *     <every other prerequisite that is not ignored> \
 *       $(wildcard include/config/...) \   (from scanning each file)
 *   <target>: $(deps_<target>)
 *   $(deps_<target>):
 *
 * Each listed file, including the source file, is read and scanned for
 * CONFIG_ references. Exits with status 1 if no source file was found.
 *
 * Important: The below generated source_foo.o and deps_foo.o variable
 * assignments are parsed not only by make, but also by the rather simple
 * parser in scripts/mod/sumversion.c.
 */
static void parse_dep_file(char *p, const char *target)
{
	bool saw_any_target = false;
	bool is_target = true;
	bool is_source = false;
	bool need_parse;
	char *q, saved_c;

	while (*p) {
		/* handle some special characters first. */
		switch (*p) {
		case '#':
			/*
			 * skip comments.
			 * rustc may emit comments to dep-info.
			 */
			p++;
			while (*p != '\0' && *p != '\n') {
				/*
				 * escaped newlines continue the comment across
				 * multiple lines. Never step over the
				 * terminating NUL: a backslash as the very
				 * last byte would otherwise move p past the
				 * end of the buffer.
				 */
				if (*p == '\\' && *(p + 1) != '\0')
					p++;
				p++;
			}
			continue;
		case ' ':
		case '\t':
			/* skip whitespaces */
			p++;
			continue;
		case '\\':
			/*
			 * backslash/newline combinations continue the
			 * statement. Skip it just like a whitespace.
			 */
			if (*(p + 1) == '\n') {
				p += 2;
				continue;
			}
			break;
		case '\n':
			/*
			 * Makefiles use a line-based syntax, where the newline
			 * is the end of a statement. After seeing a newline,
			 * we expect the next token is a target.
			 */
			p++;
			is_target = true;
			continue;
		case ':':
			/*
			 * assume the first dependency after a colon as the
			 * source file.
			 */
			p++;
			is_target = false;
			is_source = true;
			continue;
		default:
			break;
		}

		/* find the end of the token */
		q = p;
		while (*q != ' ' && *q != '\t' && *q != '\n' && *q != '#' && *q != ':') {
			if (*q == '\\') {
				/*
				 * backslash/newline combinations work like as
				 * a whitespace, so this is the end of token.
				 */
				if (*(q + 1) == '\n')
					break;

				/*
				 * escaped special characters: shift the part of
				 * the token scanned so far one byte to the
				 * right, over the backslash, so the token no
				 * longer contains the escape character.
				 */
				if (*(q + 1) == '#' || *(q + 1) == ':') {
					memmove(p + 1, p, q - p);
					p++;
				}

				/* step onto the character after the backslash */
				q++;
			}

			if (*q == '\0')
				break;
			q++;
		}

		/* Just discard the target */
		if (is_target) {
			p = q;
			continue;
		}

		/* terminate the token so it can be used as a C string */
		saved_c = *q;
		*q = '\0';
		need_parse = false;

		/*
		 * Do not list the source file as dependency, so that kbuild is
		 * not confused if a .c file is rewritten into .S or vice versa.
		 * Storing it in source_* is needed for modpost to compute
		 * srcversions.
		 */
		if (is_source) {
			/*
			 * The DT build rule concatenates multiple dep files.
			 * When processing them, only process the first source
			 * name, which will be the original one, and ignore any
			 * other source names, which will be intermediate
			 * temporary files.
			 */
			if (!saw_any_target) {
				saw_any_target = true;
				printf("source_%s := %s\n\n", target, p);
				printf("deps_%s := \\\n", target);
				need_parse = true;
			}
		} else if (!is_ignored_file(p, q - p)) {
			printf("  %s \\\n", p);
			need_parse = true;
		}

		if (need_parse) {
			void *buf;

			/* scan the file itself for CONFIG_ references */
			buf = read_file(p);
			parse_config_file(buf);
			free(buf);
		}

		/* restore the byte that was overwritten and move on */
		is_source = false;
		*q = saved_c;
		p = q;
	}

	if (!saw_any_target) {
		fprintf(stderr, "fixdep: parse error; no targets found\n");
		exit(1);
	}

	printf("\n%s: $(deps_%s)\n\n", target, target);
	printf("$(deps_%s):\n", target);
}
398 
/*
 * Entry point: fixdep <depfile> <target> <cmdline>
 *
 * Writes the "savedcmd_<target>" assignment followed by the rewritten
 * dependency information for <depfile> to stdout. Returns 0 on success;
 * exits with status 1 on a usage error or if stdout reported a write
 * error.
 */
int main(int argc, char *argv[])
{
	void *depbuf;

	if (argc != 4)
		usage();

	/* argv[1] = depfile, argv[2] = target, argv[3] = cmdline */
	printf("savedcmd_%s := %s\n\n", argv[2], argv[3]);

	depbuf = read_file(argv[1]);
	parse_dep_file(depbuf, argv[2]);
	free(depbuf);

	fflush(stdout);

	/*
	 * In the intended usage, the stdout is redirected to .*.cmd files.
	 * Call ferror() to catch errors such as "No space left on device".
	 */
	if (!ferror(stdout))
		return 0;

	fprintf(stderr, "fixdep: not all data was written to the output\n");
	exit(1);
}
430