[Reproducible-builds] [strip-nondeterminism] 01/06: Add javadoc handler

Andrew Ayer agwa at andrewayer.name
Sun Sep 14 05:14:41 UTC 2014


This is an automated email from the git hooks/post-receive script.

agwa-guest pushed a commit to branch master
in repository strip-nondeterminism.

commit daae69112a4816bc88e56865bdfd34c4f0b38443
Author: Andrew Ayer <agwa at andrewayer.name>
Date:   Sat Sep 13 16:53:27 2014 -0700

    Add javadoc handler
    
    For now it only handles standalone html files, not html files embedded
    in a Jar file.
---
 lib/StripNondeterminism.pm                  |  6 +++
 lib/StripNondeterminism/handlers/javadoc.pm | 66 +++++++++++++++++++++++++++++
 2 files changed, 72 insertions(+)

diff --git a/lib/StripNondeterminism.pm b/lib/StripNondeterminism.pm
index b01d673..5a225dd 100644
--- a/lib/StripNondeterminism.pm
+++ b/lib/StripNondeterminism.pm
@@ -24,6 +24,7 @@ use warnings;
 use StripNondeterminism::handlers::ar;
 use StripNondeterminism::handlers::gzip;
 use StripNondeterminism::handlers::jar;
+use StripNondeterminism::handlers::javadoc;
 use StripNondeterminism::handlers::zip;
 
 our($VERSION);
@@ -57,6 +58,10 @@ sub get_normalizer_for_file {
 	if (m/\.jar$/ && _get_file_type($_) =~ m/Zip archive data/) {
 		return \&StripNondeterminism::handlers::jar::normalize;
 	}
+	# javadoc
+	if (m/\.html$/ && StripNondeterminism::handlers::javadoc::is_javadoc_file($_)) {
+		return \&StripNondeterminism::handlers::javadoc::normalize;
+	}
 	# zip
 	if (m/\.zip$/ && _get_file_type($_) =~ m/Zip archive data/) {
 		return \&StripNondeterminism::handlers::zip::normalize;
@@ -69,6 +74,7 @@ sub get_normalizer_by_name {
 	return \&StripNondeterminism::handlers::ar::normalize if $_ eq 'ar';
 	return \&StripNondeterminism::handlers::gzip::normalize if $_ eq 'gzip';
 	return \&StripNondeterminism::handlers::jar::normalize if $_ eq 'jar';
+	return \&StripNondeterminism::handlers::javadoc::normalize if $_ eq 'javadoc';
 	return \&StripNondeterminism::handlers::zip::normalize if $_ eq 'zip';
 	return undef;
 }
diff --git a/lib/StripNondeterminism/handlers/javadoc.pm b/lib/StripNondeterminism/handlers/javadoc.pm
new file mode 100644
index 0000000..94ad012
--- /dev/null
+++ b/lib/StripNondeterminism/handlers/javadoc.pm
@@ -0,0 +1,66 @@
+#
+# Copyright 2014 Andrew Ayer
+#
+# This file is part of strip-nondeterminism.
+#
+# strip-nondeterminism is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# strip-nondeterminism is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with strip-nondeterminism.  If not, see <http://www.gnu.org/licenses/>.
+#
+package StripNondeterminism::handlers::javadoc;
+
+use strict;
+use warnings;
+
+use File::Temp qw/tempfile/;
+use File::Basename;
+
+sub is_javadoc_file {
+	my ($filename) = @_;
+
+	# If this is a javadoc file, '<!-- Generated by javadoc' should appear in first 1kb
+	my $fh;
+	my $str;
+	return open($fh, '<', $filename) && read($fh, $str, 1024) && $str =~ /\<!-- Generated by javadoc/;
+}
+
+sub normalize {
+	my ($filename) = @_;
+
+	open(my $fh, '<', $filename) or die "Unable to open $filename for reading: $!";
+	my ($out_fh, $out_filename) = tempfile(DIR => dirname($filename), UNLINK => 1);
+
+	# Strip the javadoc comment, which contains a timestamp.
+	# It should appear within first 10 lines.
+	while (defined(my $line = <$fh>) && $. <= 10) {
+		if ($line =~ /\<!-- Generated by javadoc .* --\>/) {
+			$line =~ s/\<!-- Generated by javadoc .* --\>//g;
+			print $out_fh $line unless $line =~ /^\s*$/; # elide lines that are now whitespace-only
+
+			# Copy through rest of file
+			my $bytes_read;
+			my $buf;
+			while ($bytes_read = read($fh, $buf, 4096)) {
+				print $out_fh $buf;
+			}
+			defined($bytes_read) or die "$filename: read failed: $!";
+
+			# Rename temporary file over the file
+			chmod((stat($fh))[2] & 07777, $out_filename);
+			rename($out_filename, $filename) or die "$filename: unable to overwrite: rename: $!";
+			last;
+		}
+		print $out_fh $line;
+	}
+}
+
+1;

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/reproducible/strip-nondeterminism.git



More information about the Reproducible-builds mailing list