ccache/ccache.c

539 lines
12 KiB
C
Raw Normal View History

2002-03-26 15:46:43 +01:00
/*
a re-implementation of the compilercache scripts in C
The idea is based on the shell-script compilercache by Erik Thiele <erikyyy@erikyyy.de>
2002-03-27 00:58:31 +01:00
Copyright (C) Andrew Tridgell 2002
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
2002-03-26 15:46:43 +01:00
*/
#include "ccache.h"
2002-03-27 00:58:31 +01:00
static char *cache_dir;
char *cache_logfile = NULL;
2002-03-26 15:46:43 +01:00
static ARGS *stripped_args;
static ARGS *orig_args;
static char *output_file;
static char *hashname;
static int found_debug;
2002-03-27 00:58:31 +01:00
/*
something went badly wrong - just execute the real compiler
*/
2002-03-26 15:46:43 +01:00
static void failed(void)
{
execv(orig_args->argv[0], orig_args->argv);
cc_log("execv returned (%s)!\n", strerror(errno));
exit(1);
}
/* run the real compiler and put the result in cache */
static void to_cache(ARGS *args)
{
2002-03-27 01:39:06 +01:00
char *path_stderr;
char *tmp_stdout, *tmp_stderr, *tmp_hashname;
2002-03-26 15:46:43 +01:00
struct stat st;
2002-03-27 01:39:06 +01:00
int status;
2002-03-26 15:46:43 +01:00
2002-03-27 01:39:06 +01:00
x_asprintf(&tmp_stdout, "%s/tmp.stdout.%d", cache_dir, getpid());
x_asprintf(&tmp_stderr, "%s/tmp.stderr.%d", cache_dir, getpid());
x_asprintf(&tmp_hashname, "%s/tmp.hash.%d.o", cache_dir, getpid());
2002-03-26 15:46:43 +01:00
args_add(args, "-o");
2002-03-27 01:39:06 +01:00
args_add(args, tmp_hashname);
status = execute(args->argv, tmp_stdout, tmp_stderr);
args->argc -= 2;
2002-03-26 15:46:43 +01:00
if (stat(tmp_stdout, &st) != 0 || st.st_size != 0) {
cc_log("compiler produced stdout for %s\n", output_file);
2002-03-27 01:39:06 +01:00
unlink(tmp_stdout);
unlink(tmp_stderr);
unlink(tmp_hashname);
failed();
}
unlink(tmp_stdout);
2002-03-26 15:46:43 +01:00
if (status != 0) {
int fd;
cc_log("compile of %s gave status = %d\n", output_file, status);
fd = open(tmp_stderr, O_RDONLY);
if (fd != -1 &&
(rename(tmp_hashname, output_file) == 0 || errno == ENOENT)) {
/* we can use a quick method of getting the failed output */
copy_fd(fd, 2);
close(fd);
unlink(tmp_stderr);
exit(status);
}
2002-03-27 01:39:06 +01:00
unlink(tmp_stderr);
unlink(tmp_hashname);
failed();
}
2002-03-26 15:46:43 +01:00
2002-03-27 01:39:06 +01:00
x_asprintf(&path_stderr, "%s.stderr", hashname);
if (rename(tmp_hashname, hashname) != 0 ||
rename(tmp_stderr, path_stderr) != 0) {
cc_log("failed to rename tmp files\n");
2002-03-26 15:46:43 +01:00
failed();
}
cc_log("Placed %s into cache\n", output_file);
2002-03-27 01:39:06 +01:00
free(tmp_hashname);
free(tmp_stderr);
free(tmp_stdout);
free(path_stderr);
2002-03-26 15:46:43 +01:00
}
2002-03-27 00:58:31 +01:00
/* hash a file that consists of preprocessor output, but remove any line
number information from the hash
*/
2002-03-26 15:46:43 +01:00
static void stabs_hash(const char *fname)
{
int fd;
struct stat st;
char *map;
int l_start, l_end;
fd = open(fname, O_RDONLY);
if (fd == -1 || fstat(fd, &st) != 0) {
cc_log("Failed to open preprocessor output %s\n", fname);
2002-03-27 00:58:31 +01:00
failed();
}
2002-03-26 15:46:43 +01:00
2002-03-27 09:02:24 +01:00
/* we use mmap() to make it easy to handle arbitrarily long
2002-03-27 08:12:30 +01:00
lines in preprocessor output. I have seen lines of over
100k in length, so this is well worth it */
map = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0);
if (map == (void *)-1) {
cc_log("Failed to mmap %s\n", fname);
2002-03-26 15:46:43 +01:00
failed();
}
close(fd);
2002-03-26 15:46:43 +01:00
l_start = 0;
while (l_start < st.st_size) {
l_end = l_start;
while (l_end < st.st_size && map[l_end] != '\n') {
l_end++;
}
2002-03-27 08:12:30 +01:00
/* skip the hash on any lines that look like compiler line
numbers */
if ((l_end - l_start) > 2 &&
map[l_start] == '#' && map[l_start+1] == ' ' &&
isdigit(map[l_start+2])) {
l_start = l_end+1;
2002-03-26 15:46:43 +01:00
continue;
}
hash_buffer(&map[l_start], 1 + l_end - l_start);
l_start = l_end+1;
2002-03-26 15:46:43 +01:00
}
munmap(map, st.st_size);
2002-03-26 15:46:43 +01:00
}
/* find the hash for a command. The hash includes all argument lists,
plus the output from running the compiler with -E */
static void find_hash(ARGS *args)
{
int i;
2002-03-27 01:39:06 +01:00
char *path_stdout, *path_stderr;
2002-03-26 16:11:48 +01:00
char *hash_dir;
char *s;
struct stat st;
2002-03-27 01:39:06 +01:00
int status;
2002-03-26 15:46:43 +01:00
hash_start();
/* first the arguments */
for (i=0;i<args->argc;i++) {
/* some arguments don't contribute to the hash. The
theory is that these arguments will change the
output of -E if they are going to have any effect
at all, or they only affect linking */
if (i < args->argc-1) {
if (strcmp(args->argv[i], "-I") == 0 ||
strcmp(args->argv[i], "-include") == 0 ||
strcmp(args->argv[i], "-L") == 0 ||
strcmp(args->argv[i], "-D") == 0 ||
strcmp(args->argv[i], "-isystem") == 0) {
i++;
continue;
}
if (strncmp(args->argv[i], "-I", 2) == 0 ||
strncmp(args->argv[i], "-L", 2) == 0 ||
2002-03-27 09:02:24 +01:00
strncmp(args->argv[i], "-D", 2) == 0 ||
strncmp(args->argv[i], "-isystem", 8) == 0) {
continue;
}
}
2002-03-26 15:46:43 +01:00
hash_string(args->argv[i]);
}
/* the compiler driver size and date. This is a simple minded way
to try and detect compiler upgrades. It is not 100% reliable */
if (stat(args->argv[0], &st) != 0) {
cc_log("Couldn't stat the compiler!?\n");
failed();
}
hash_int(st.st_size);
hash_int(st.st_mtime);
2002-03-26 15:46:43 +01:00
/* now the run */
x_asprintf(&path_stdout, "%s/tmp.stdout.%d", cache_dir, getpid());
x_asprintf(&path_stderr, "%s/tmp.stderr.%d", cache_dir, getpid());
args_add(args, "-E");
2002-03-27 01:39:06 +01:00
status = execute(args->argv, path_stdout, path_stderr);
2002-03-26 15:46:43 +01:00
args->argc--;
2002-03-27 01:39:06 +01:00
if (status != 0) {
unlink(path_stdout);
unlink(path_stderr);
cc_log("the preprocessor gave %d\n", status);
failed();
}
/* if the compilation is with -g then we have to inlcude the whole of the
preprocessor output, which means we are sensitive to line number
information. Otherwise we can discard line number info, which makes
us less sensitive to reformatting changes
*/
2002-03-26 15:46:43 +01:00
if (found_debug) {
hash_file(path_stdout);
} else {
stabs_hash(path_stdout);
}
hash_file(path_stderr);
unlink(path_stdout);
unlink(path_stderr);
free(path_stdout);
free(path_stderr);
2002-03-27 00:58:31 +01:00
/* we use a single level subdir for the cache path to reduce the impact
on filesystems which are slow for large directories
*/
2002-03-26 16:11:48 +01:00
s = hash_result();
x_asprintf(&hash_dir, "%s/%c", cache_dir, *s);
if (create_dir(hash_dir) != 0) {
cc_log("failed to create %s\n", cache_dir);
failed();
}
2002-03-26 16:11:48 +01:00
x_asprintf(&hashname, "%s/%s", hash_dir, s+1);
free(hash_dir);
2002-03-26 15:46:43 +01:00
}
/*
try to return the compile result from cache. If we can return from
cache then this function exits with the correct status code,
otherwise it returns */
static void from_cache(int first)
{
2002-03-27 01:39:06 +01:00
int fd_stderr;
2002-03-26 15:46:43 +01:00
char *s;
2002-03-27 01:39:06 +01:00
int ret;
2002-03-26 15:46:43 +01:00
x_asprintf(&s, "%s.stderr", hashname);
fd_stderr = open(s, O_RDONLY);
free(s);
if (fd_stderr == -1) {
2002-03-27 01:39:06 +01:00
/* it isn't in cache ... */
2002-03-26 15:46:43 +01:00
return;
}
unlink(output_file);
ret = link(hashname, output_file);
if (ret == -1 && errno != ENOENT) {
ret = copy_file(hashname, output_file);
if (ret == -1 && errno != ENOENT) {
cc_log("failed to copy %s -> %s (%s)\n",
hashname, output_file, strerror(errno));
failed();
}
}
if (ret == 0) {
utime(output_file, NULL);
2002-03-26 15:46:43 +01:00
}
/* send the stderr */
copy_fd(fd_stderr, 2);
close(fd_stderr);
/* and exit with the right status code */
if (first) {
2002-03-27 01:39:06 +01:00
cc_log("got cached result for %s\n", output_file);
2002-03-26 16:11:48 +01:00
}
2002-03-27 01:39:06 +01:00
exit(0);
2002-03-26 15:46:43 +01:00
}
2002-03-27 00:58:31 +01:00
/* find the real compiler. We just search the PATH to find a executable of the
same name that isn't a link to ourselves */
2002-03-26 15:46:43 +01:00
static char *find_compiler(const char *argv0)
{
char *p;
char *base;
char *path, *tok;
struct stat st1, st2;
int found_one = 0;
2002-03-26 15:46:43 +01:00
p = strrchr(argv0, '/');
if (p) {
base = x_strdup(p+1);
2002-03-26 15:46:43 +01:00
} else {
base = x_strdup(argv0);
}
/* try to find ourselves the linux way */
if (stat("/proc/self/exe", &st1) == 0) {
found_one = 1;
}
/* they might have given a full path ... */
if (!found_one && strchr(argv0, '/') && stat(argv0, &st1) == 0) {
found_one = 1;
2002-03-26 15:46:43 +01:00
}
path = getenv("CCACHE_PATH");
if (!path) {
path = getenv("PATH");
}
if (!path) {
cc_log("no PATH variable!?\n");
failed();
}
2002-03-26 15:46:43 +01:00
path = x_strdup(path);
/* search the path looking for the first compiler of the same name
that isn't us */
for (tok=strtok(path,":"); tok; tok = strtok(NULL, ":")) {
char *fname;
x_asprintf(&fname, "%s/%s", tok, base);
/* look for a normal executable file */
if (access(fname, X_OK) == 0 &&
stat(fname, &st2) == 0 &&
S_ISREG(st2.st_mode)) {
/* we have a candidate */
if (!found_one) {
st1 = st2;
found_one = 1;
continue;
}
2002-03-26 15:46:43 +01:00
if (st1.st_size != st2.st_size ||
st1.st_dev != st2.st_dev ||
st1.st_ino != st2.st_ino) {
/* found it! */
free(path);
return fname;
}
}
}
return NULL;
}
2002-03-27 00:58:31 +01:00
/*
process the compiler options to form the correct set of options
for obtaining the preprocessor output
*/
2002-03-26 15:46:43 +01:00
static void process_args(int argc, char **argv)
{
int i;
int found_c_opt = 0;
int found_S_opt = 0;
2002-03-26 15:46:43 +01:00
char *input_file = NULL;
stripped_args = args_init();
args_add(stripped_args, argv[0]);
for (i=1; i<argc; i++) {
2002-03-27 08:31:55 +01:00
/* some options will never work ... */
if (strncmp(argv[i], "-E", 2) == 0 ||
strncmp(argv[i], "-M", 2) == 0) {
2002-03-26 15:46:43 +01:00
failed();
}
2002-03-27 00:58:31 +01:00
/* we must have -c */
2002-03-26 15:46:43 +01:00
if (strcmp(argv[i], "-c") == 0) {
args_add(stripped_args, argv[i]);
found_c_opt = 1;
continue;
}
/* -S changes the default extension */
if (strcmp(argv[i], "-S") == 0) {
args_add(stripped_args, argv[i]);
found_S_opt = 1;
continue;
}
2002-03-27 00:58:31 +01:00
/* we need to work out where the output was meant to go */
2002-03-26 15:46:43 +01:00
if (strcmp(argv[i], "-o") == 0) {
if (i == argc-1) {
cc_log("missing argument to %s\n", argv[i]);
failed();
}
output_file = argv[i+1];
i++;
continue;
}
2002-03-27 00:58:31 +01:00
/* debugging is handled specially, so that we know if we
can strip line number info
*/
2002-03-26 15:46:43 +01:00
if (strncmp(argv[i], "-g", 2) == 0) {
args_add(stripped_args, argv[i]);
if (strcmp(argv[i], "-g0") != 0) {
found_debug = 1;
}
continue;
}
/* options that take an argument */
if (strcmp(argv[i], "-I") == 0 ||
strcmp(argv[i], "-include") == 0 ||
strcmp(argv[i], "-L") == 0 ||
strcmp(argv[i], "-D") == 0 ||
strcmp(argv[i], "-isystem") == 0) {
if (i == argc-1) {
cc_log("missing argument to %s\n", argv[i]);
failed();
}
args_add(stripped_args, argv[i]);
args_add(stripped_args, argv[i+1]);
i++;
continue;
}
2002-03-27 00:58:31 +01:00
/* other options */
2002-03-26 15:46:43 +01:00
if (argv[i][0] == '-') {
args_add(stripped_args, argv[i]);
continue;
}
if (input_file) {
cc_log("multiple input files (%s and %s)\n",
input_file, argv[i]);
failed();
}
input_file = argv[i];
args_add(stripped_args, argv[i]);
}
2002-03-26 16:11:48 +01:00
if (!input_file) {
cc_log("No input file found\n");
2002-03-26 15:46:43 +01:00
failed();
}
2002-03-26 16:11:48 +01:00
if (!found_c_opt) {
cc_log("No -c option found for %s\n", input_file);
2002-03-26 15:46:43 +01:00
failed();
}
if (!output_file) {
char *p;
2002-03-27 00:58:31 +01:00
output_file = x_strdup(input_file);
2002-03-26 15:46:43 +01:00
if ((p = strrchr(output_file, '/'))) {
output_file = p+1;
}
p = strrchr(output_file, '.');
if (!p || !p[1]) {
cc_log("badly formed output_file %s\n", output_file);
failed();
}
p[1] = found_S_opt ? 's' : 'o';
2002-03-26 15:46:43 +01:00
p[2] = 0;
#if 0
cc_log("Formed output file %s from input_file %s\n",
output_file, input_file);
#endif
}
}
2002-03-27 00:58:31 +01:00
/* the main ccache driver function */
2002-03-26 15:46:43 +01:00
static void ccache(int argc, char *argv[])
{
/* find the real compiler */
argv[0] = find_compiler(argv[0]);
if (!argv[0]) {
exit(STATUS_NOTFOUND);
}
orig_args = args_init();
orig_args->argv = argv;
orig_args->argc = argc;
2002-03-27 07:15:32 +01:00
if (getenv("CCACHE_DISABLE")) {
cc_log("ccache is disabled\n");
failed();
}
2002-03-26 15:46:43 +01:00
/* process argument list, returning a new set of arguments for pre-processing */
process_args(argc, argv);
/* run with -E to find the hash */
find_hash(stripped_args);
/* if we can return from cache at this point then do */
from_cache(1);
/* run real compiler, semding output to cache */
to_cache(stripped_args);
/* return from cache */
from_cache(0);
/* oh oh! */
cc_log("secondary from_cache failed!\n");
failed();
}
int main(int argc, char *argv[])
{
2002-03-27 00:58:31 +01:00
cache_dir = getenv("CCACHE_DIR");
if (!cache_dir) {
x_asprintf(&cache_dir, "%s/.ccache", getenv("HOME"));
}
2002-03-27 00:58:31 +01:00
cache_logfile = getenv("CCACHE_LOGFILE");
/* make sure the cache dir exists */
if (create_dir(cache_dir) != 0) {
fprintf(stderr,"ccache: failed to create %s (%s)\n",
2002-03-26 15:46:43 +01:00
cache_dir, strerror(errno));
exit(1);
}
2002-03-27 00:58:31 +01:00
2002-03-26 15:46:43 +01:00
ccache(argc, argv);
return 1;
}