korgupload: stricter filename checking, is_clean_string() in parse

Be stricter about the filename checking and reject more corner cases; in particular, reject any filenames starting with dot entirely. Set the limit for total pathname and filename components significantly below OS limits. This version will run is_clean_string() redundantly on a lot of strings; there simply is no good reason to remove checks already in place. Suggested-by: Linus Torvalds <torvalds@linux-foundation.org> Signed-off-by: H. Peter Anvin <hpa@zytor.com>
author: H. Peter Anvin <hpa@zytor.com> 2011-10-01 18:27:39 -0700
committer: H. Peter Anvin <hpa@zytor.com> 2011-10-01 18:27:39 -0700
commit: 8cf1fdbbb881a43326343b4ba641cf86c6875d4c (patch)
tree: fde135f594de600198f431301d49b9af434bc8a0
parent: 7db3f67f5bc92302ef223e6aea832e9e4bfac08b (diff)
download: kup-8cf1fdbbb881a43326343b4ba641cf86c6875d4c.tar.gz
1 files changed, 33 insertions, 29 deletions
diff --git a/korgupload b/korgupload
index acbe7dd..8cce203 100755
--- a/korgupload
+++ b/korgupload
@@ -137,6 +137,21 @@ sub url_unescape($)
     return $o;
 }
 
+# Return true if the supplied string is valid UTF-8 without special
+# characters
+sub is_clean_string($)
+{
+    no bytes;
+    # use feature 'unicode_strings';	-- is this needed here?
+
+    my($b) = @_;
+    my $f = decode('UTF-8', $b, Encode::FB_DEFAULT);
+
+    return 0 if ($f =~ m:[\x{0000}-\x{001f}\x{007f}-\x{00a0}\x{fffd}-\x{ffff}]:);
+    return 1;
+}    
+
+# Decode the argument line
 sub parse_line($)
 {
     my($line) = @_;
@@ -154,7 +169,7 @@ sub parse_line($)
 
 	foreach my $ra (@rawargs) {
 	    my $a = url_unescape($ra);
-	    return undef if (!defined($a));
+	    return undef if (!defined($a) || !is_clean_string($a));
 	    push(@args, $a);
 	}
     }
@@ -162,40 +177,29 @@ sub parse_line($)
     return ($cmd, @args);
 }
 
-# Return true if the supplied string is valid UTF-8 without special
-# characters
-sub is_clean_string($)
-{
-    no bytes;
-    # use feature 'unicode_strings';	-- is this needed here?
-
-    my($b) = @_;
-    my $f = decode('UTF-8', $b, Encode::FB_DEFAULT);
-
-    return 0 if ($f =~ m:[\x{0000}-\x{001f}\x{007f}-\x{00a0}\x{fffd}-\x{ffff}]:);
-    return 1;
-}    
-
 # This returns true if the given argument is a valid filename in its
-# canonical form.  Double slashes, relative paths, control characters,
-# and malformed UTF-8 is not permitted.  We cap the length of each
-# pathname component to 251 characters to we can add an extension
-# without worrying about it.
+# canonical form.  Double slashes, relative paths, dot files, control
+# characters, and malformed UTF-8 is not permitted.  We cap the length
+# of each pathname component to 100 bytes to we can add an extension
+# without worrying about it, and the entire pathname to 1024 bytes.
 sub is_valid_filename($)
 {
     use bytes;
 
     my($f) = @_;
 
-    return 0 if (!is_clean_string($f));
-    return 0 if ($f !~ m:^/:);
-    return 0 if ($f =~ m:/$:);
-    return 0 if ($f =~ m://:);
-    return 0 if ($f =~ m:/(\.|\.\.)(/|$):);
-
-    # Make sure we can create a 255-byte-long filename after adding
-    # .bz2 or similar.  We can't use the obvious regexp here, because
-    # regexps operate on characters, not bytes.
+    return 0 if (length($f) > 1024); # Reject ridiculously long paths
+    return 0 if (!is_clean_string($f)); # Reject bad UTF-8 and control characters
+    return 0 if ($f !~ m:^/:);	# Reject relative paths
+    return 0 if ($f =~ m:/$:);	# Reject paths ending in /
+    return 0 if ($f =~ m://:);	# Reject double slashes
+    return 0 if ($f =~ m:/\.:);	# Reject any filename component starting with dot,
+    				# including . and ..
+
+    # Make sure we can create a filename after adding .bz2 or similar.
+    # We can't use the obvious regexp here, because regexps operate on
+    # characters, not bytes.  The limit of 100 is semi-arbitrary, but
+    # we shouldn't need filenames that long.
     my $n = 0;
     my $nmax = 0;
     for (my $i = 0; $i < length($f); $i++) {
@@ -203,7 +207,7 @@ sub is_valid_filename($)
 	$n = ($c eq '/') ? 0 : $n+1;
 	$nmax = ($n > $nmax) ? $n : $nmax;
     }
-    return 0 if ($nmax > 251);
+    return 0 if ($nmax > 100);
 
     return 1;
 }
author	H. Peter Anvin <hpa@zytor.com>	2011-10-01 18:27:39 -0700
committer	H. Peter Anvin <hpa@zytor.com>	2011-10-01 18:27:39 -0700
commit	8cf1fdbbb881a43326343b4ba641cf86c6875d4c (patch)
tree	fde135f594de600198f431301d49b9af434bc8a0
parent	7db3f67f5bc92302ef223e6aea832e9e4bfac08b (diff)
download	kup-8cf1fdbbb881a43326343b4ba641cf86c6875d4c.tar.gz