diff options
author | gary <gary@138bc75d-0d04-0410-961f-82ee72b054a4> | 2006-06-06 15:09:20 +0000 |
---|---|---|
committer | gary <gary@138bc75d-0d04-0410-961f-82ee72b054a4> | 2006-06-06 15:09:20 +0000 |
commit | 8dc10789d233904a25d3210557561d4b64210043 (patch) | |
tree | 1bf59618bf924a1b5a39b4a3404428ec2cebfef4 | |
parent | feb71a634d13e4037c9af2306b123097f1e6436f (diff) | |
download | gcc-8dc10789d233904a25d3210557561d4b64210043.tar.gz |
* java/io/natFilePosix.cc (getCanonicalPath): Rewritten.
* configure.ac: Remove realpath check and add checks for
lstat and readlink.
* configure: Rebuilt.
* include/config.h.in: Likewise.
* java/io/File.java: Javadoc fix.
git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@114434 138bc75d-0d04-0410-961f-82ee72b054a4
-rw-r--r-- | libjava/ChangeLog | 9 | ||||
-rwxr-xr-x | libjava/configure | 2 | ||||
-rw-r--r-- | libjava/configure.ac | 2 | ||||
-rw-r--r-- | libjava/include/config.h.in | 7 | ||||
-rw-r--r-- | libjava/java/io/File.java | 6 | ||||
-rw-r--r-- | libjava/java/io/natFilePosix.cc | 215 |
6 files changed, 163 insertions, 78 deletions
diff --git a/libjava/ChangeLog b/libjava/ChangeLog index 38660610526..76031d52572 100644 --- a/libjava/ChangeLog +++ b/libjava/ChangeLog @@ -1,3 +1,12 @@ +2006-06-06 Gary Benson <gbenson@redhat.com> + + * java/io/natFilePosix.cc (getCanonicalPath): Rewritten. + * configure.ac: Remove realpath check and add checks for + lstat and readlink. + * configure: Rebuilt. + * include/config.h.in: Likewise. + * java/io/File.java: Javadoc fix. + 2006-06-05 Andreas Schwab <schwab@suse.de> PR libgcj/27860 diff --git a/libjava/configure b/libjava/configure index 96ba1bfacc5..7b3f0f164f5 100755 --- a/libjava/configure +++ b/libjava/configure @@ -10396,7 +10396,7 @@ else for ac_func in strerror ioctl select fstat open fsync sleep opendir \ gmtime_r localtime_r readdir_r getpwuid_r getcwd \ - access stat mkdir rename rmdir unlink realpath utime chmod \ + access stat lstat mkdir rename rmdir unlink utime chmod readlink \ nl_langinfo setlocale \ inet_pton uname inet_ntoa \ fork execvp pipe sigaction ftruncate mmap diff --git a/libjava/configure.ac b/libjava/configure.ac index 28702b00bf7..a02e25f3ab1 100644 --- a/libjava/configure.ac +++ b/libjava/configure.ac @@ -897,7 +897,7 @@ if test "x${with_newlib}" = "xyes"; then else AC_CHECK_FUNCS([strerror ioctl select fstat open fsync sleep opendir \ gmtime_r localtime_r readdir_r getpwuid_r getcwd \ - access stat mkdir rename rmdir unlink realpath utime chmod \ + access stat lstat mkdir rename rmdir unlink utime chmod readlink \ nl_langinfo setlocale \ inet_pton uname inet_ntoa \ fork execvp pipe sigaction ftruncate mmap]) diff --git a/libjava/include/config.h.in b/libjava/include/config.h.in index 5d67c859b10..2ef617103b1 100644 --- a/libjava/include/config.h.in +++ b/libjava/include/config.h.in @@ -169,6 +169,9 @@ /* Define to 1 if you have the `localtime_r' function. */ #undef HAVE_LOCALTIME_R +/* Define to 1 if you have the `lstat' function. */ +#undef HAVE_LSTAT + /* Define to 1 if you have the `memcpy' function. */ #undef HAVE_MEMCPY @@ -226,8 +229,8 @@ /* Define to 1 if you have the `readdir_r' function. */ #undef HAVE_READDIR_R -/* Define to 1 if you have the `realpath' function. */ -#undef HAVE_REALPATH +/* Define to 1 if you have the `readlink' function. */ +#undef HAVE_READLINK /* Define to 1 if you have the `rename' function. */ #undef HAVE_RENAME diff --git a/libjava/java/io/File.java b/libjava/java/io/File.java index 1b02b601aaf..55b7b08b931 100644 --- a/libjava/java/io/File.java +++ b/libjava/java/io/File.java @@ -508,9 +508,9 @@ public class File implements Serializable, Comparable /** * This method returns a canonical representation of the pathname of * this file. The actual form of the canonical representation is - * different. On the GNU system, the canonical form differs from the - * absolute form in that all relative file references to "." and ".." - * are resolved and removed. + * system-dependent. On the GNU system, conversion to canonical + * form involves the removal of redundant separators, references to + * "." and "..", and symbolic links. * <p> * Note that this method, unlike the other methods which return path * names, can throw an IOException. This is because native method diff --git a/libjava/java/io/natFilePosix.cc b/libjava/java/io/natFilePosix.cc index 580b5955ac0..356fc2e5533 100644 --- a/libjava/java/io/natFilePosix.cc +++ b/libjava/java/io/natFilePosix.cc @@ -101,94 +101,167 @@ java::io::File::attr (jint query) #endif } +// These two methods are used to maintain dynamically allocated +// buffers for getCanonicalPath without the overhead of calling +// realloc every time a buffer is modified. Buffers are sized +// at the smallest multiple of CHUNKSIZ that is greater than or +// equal to the desired length. The default CHUNKSIZ is 256, +// longer than most paths, so in most cases a getCanonicalPath +// will require only one malloc per buffer. + +#define CHUNKLOG 8 +#define CHUNKSIZ (1 << CHUNKLOG) + +static int +nextChunkSize (int size) +{ + return ((size >> CHUNKLOG) + ((size & (CHUNKSIZ - 1)) ? 1 : 0)) << CHUNKLOG; +} + +static char * +maybeGrowBuf (char *buf, int *size, int required) +{ + if (required > *size) + { + *size = nextChunkSize (required); + buf = (char *) _Jv_Realloc (buf, *size); + } + return buf; +} + +// Return a canonical representation of the pathname of this file. On +// the GNU system this involves the removal of redundant separators, +// references to "." and "..", and symbolic links. +// +// The conversion proceeds on a component-by-component basis: symbolic +// links and references to ".." are resolved as and when they occur. +// This means that if "/foo/bar" is a symbolic link to "/baz" then the +// canonical form of "/foo/bar/.." is "/" and not "/foo". +// +// In order to mimic the behaviour of proprietary JVMs, non-existant +// path components are allowed (a departure from the normal GNU system +// convention). This means that if "/foo/bar" is a symbolic link to +// "/baz", the canonical form of "/non-existant-directory/../foo/bar" +// is "/baz". + jstring java::io::File::getCanonicalPath (void) { - // We use `+2' here because we might need to use `.' for our special - // case. - char *buf = (char *) __builtin_alloca (JvGetStringUTFLength (path) + 2); - char buf2[MAXPATHLEN]; - jsize total = JvGetStringUTFRegion (path, 0, path->length(), buf); + jstring path = getAbsolutePath (); - // Special case: treat "" the same as ".". - if (total == 0) - buf[total++] = '.'; + int len = JvGetStringUTFLength (path); + int srcl = nextChunkSize (len + 1); + char *src = (char *) _Jv_Malloc (srcl); + JvGetStringUTFRegion (path, 0, path->length(), src); + src[len] = '\0'; + int srci = 1; - buf[total] = '\0'; + int dstl = nextChunkSize (2); + char *dst = (char *) _Jv_Malloc (dstl); + dst[0] = '/'; + int dsti = 1; + + bool fschecks = true; -#ifdef HAVE_REALPATH - if (realpath (buf, buf2) == NULL) + while (src[srci] != '\0') { - // If realpath failed, we have to come up with a canonical path - // anyway. We do this with purely textual manipulation. - // FIXME: this isn't perfect. You can construct a case where - // we get a different answer from the JDK: - // mkdir -p /tmp/a/b/c - // ln -s /tmp/a/b /tmp/a/z - // ... getCanonicalPath("/tmp/a/z/c/nosuchfile") - // We will give /tmp/a/z/c/nosuchfile, while the JDK will - // give /tmp/a/b/c/nosuchfile. - int out_idx; - if (buf[0] != '/') + // Skip slashes. + while (src[srci] == '/') + srci++; + int tmpi = srci; + // Find next slash. + while (src[srci] != '/' && src[srci] != '\0') + srci++; + if (srci == tmpi) + // We hit the end. + break; + len = srci - tmpi; + + // Handle "." and "..". + if (len == 1 && src[tmpi] == '.') + continue; + if (len == 2 && src[tmpi] == '.' && src[tmpi + 1] == '.') { - // Not absolute, so start with current directory. - if (getcwd (buf2, sizeof (buf2)) == NULL) - throw new IOException (); - out_idx = strlen (buf2); + while (dsti > 1 && dst[dsti - 1] != '/') + dsti--; + if (dsti != 1) + dsti--; + // Reenable filesystem checking if disabled, as we might + // have reversed over whatever caused the problem before. + // At least one proprietary JVM has inconsistencies because + // it does not do this. + fschecks = true; + continue; } - else - { - buf2[0] = '/'; - out_idx = 1; - } - int in_idx = 0; - while (buf[in_idx] != '\0') + + // Handle real path components. + dst = maybeGrowBuf (dst, &dstl, dsti + (dsti > 1 ? 1 : 0) + len + 1); + int dsti_save = dsti; + if (dsti > 1) + dst[dsti++] = '/'; + strncpy (&dst[dsti], &src[tmpi], len); + dsti += len; + if (fschecks == false) + continue; + +#if defined (HAVE_LSTAT) && defined (HAVE_READLINK) + struct stat sb; + dst[dsti] = '\0'; + if (::lstat (dst, &sb) == 0) { - // Skip '/'s. - while (buf[in_idx] == '/') - ++in_idx; - int elt_start = in_idx; - // Find next '/' or end of path. - while (buf[in_idx] != '\0' && buf[in_idx] != '/') - ++in_idx; - if (in_idx == elt_start) - { - // An empty component means we've reached the end. - break; - } - int len = in_idx - elt_start; - if (len == 1 && buf[in_idx] == '.') - continue; - if (len == 2 && buf[in_idx] == '.' && buf[in_idx + 1] == '.') - { - // Found ".." component, lop off last part from existing - // buffer. - --out_idx; - while (out_idx > 0 && buf2[out_idx] != '/') - --out_idx; - // Can't go up past "/". - if (out_idx == 0) - ++out_idx; - } - else + if (S_ISLNK (sb.st_mode)) { - // Append a real path component to the output. - if (out_idx > 1) - buf2[out_idx++] = '/'; - strncpy (&buf2[out_idx], &buf[elt_start], len); - out_idx += len; + int tmpl = CHUNKSIZ; + char *tmp = (char *) _Jv_Malloc (tmpl); + + while (1) + { + tmpi = ::readlink (dst, tmp, tmpl); + if (tmpi < 1) + { + _Jv_Free (src); + _Jv_Free (dst); + _Jv_Free (tmp); + throw new IOException ( + JvNewStringLatin1 ("readlink failed")); + } + if (tmpi < tmpl) + break; + tmpl += CHUNKSIZ; + tmp = (char *) _Jv_Realloc (tmp, tmpl); + } + + // Prepend the link's path to src. + tmp = maybeGrowBuf (tmp, &tmpl, tmpi + strlen (&src[srci]) + 1); + strcpy(&tmp[tmpi], &src[srci]); + _Jv_Free (src); + src = tmp; + srcl = tmpl; + srci = 0; + + // Either replace or append dst depending on whether the + // link is relative or absolute. + dsti = src[0] == '/' ? 1 : dsti_save; } } - - buf2[out_idx] = '\0'; + else + { + // Something doesn't exist, or we don't have permission to + // read it, or a previous path component is a directory, or + // a symlink is looped. Whatever, we can't check the + // filesystem any more. + fschecks = false; + } +#endif // HAVE_LSTAT && HAVE_READLINK } + dst[dsti] = '\0'; // FIXME: what encoding to assume for file names? This affects many // calls. - return JvNewStringUTF (buf2); -#else - return JvNewStringUTF (buf); -#endif + path = JvNewStringUTF (dst); + _Jv_Free (src); + _Jv_Free (dst); + return path; } jboolean |