W3C home > Mailing lists > Public > www-validator-cvs@w3.org > August 2010

link-checker commit: improve debug output in verbose mode. Patch courtesy of Michael Ernst

From: Mercurial notifier <nobody@w3.org>
Date: Thu, 05 Aug 2010 14:47:14 +0000
To: link-checker updates <www-validator-cvs@w3.org>
Message-Id: <E1Oh1j0-00063t-Rt@blinky.w3.org>
changeset:   239:e190bd27ade8
user:        ot
date:        Thu Jul 03 19:46:35 2008 +0000
files:       bin/checklink
description:
improve debug output in verbose mode. Patch courtesy of Michael Ernst


diff -r fa96404467ee -r e190bd27ade8 bin/checklink
--- a/bin/checklink	Sun May 04 16:59:22 2008 +0000
+++ b/bin/checklink	Thu Jul 03 19:46:35 2008 +0000
@@ -5,7 +5,7 @@
 # (c) 1999-2008 World Wide Web Consortium
 # based on Renaud Bruyeron's checklink.pl
 #
-# $Id: checklink,v 4.109 2008-05-04 16:59:22 ville Exp $
+# $Id: checklink,v 4.110 2008-07-03 19:46:35 ot Exp $
 #
 # This program is licensed under the W3C(r) Software License:
 #       http://www.w3.org/Consortium/Legal/copyright-software
@@ -134,7 +134,7 @@
 }
 
 #
-# Checks whether we're allowed to retrieve the document based on it's IP
+# Checks whether we're allowed to retrieve the document based on its IP
 # address.  Takes an URI object and returns a HTTP::Response containing the
 # appropriate status and error message if the IP was disallowed, 0
 # otherwise.  URIs without hostname or IP address are always allowed,
@@ -242,7 +242,7 @@
   $PROGRAM     = 'W3C-checklink';
   $VERSION     = '4.3';
   $REVISION    = sprintf('version %s (c) 1999-2008 W3C', $VERSION);
-  my ($cvsver) = q$Revision: 4.109 $ =~ /(\d+[\d\.]*\.\d+)/;
+  my ($cvsver) = q$Revision: 4.110 $ =~ /(\d+[\d\.]*\.\d+)/;
   $AGENT       = sprintf('%s/%s [%s] %s',
                          $PROGRAM, $VERSION, $cvsver, LWP::RobotUA->_agent());
 
@@ -363,6 +363,7 @@
 my %redirects;
 # Count of the number of documents checked
 my $doc_count = 0;
+
 # Time stamp
 my $timestamp = &get_timestamp();
 
@@ -910,6 +911,8 @@
   # Check links
   #############
 
+  &hprintf("Recording all the links found: %d\n", scalar (keys %{$p->{Links}}))
+    if ($Opts{Verbose});
   my %links;
   # Record all the links found
   while (my ($link, $lines) = each(%{$p->{Links}})) {
@@ -943,6 +946,8 @@
   }
 
   # Build the list of broken URI's
+  &hprintf("Checking %d links to build list of broken URI's\n", scalar (keys %links))
+    if ($Opts{Verbose});
   my %broken;
   while (my ($u, $ulinks) = each(%links)) {
 
@@ -1031,7 +1036,7 @@
       if ($Opts{HTML}) {
         if (!$Opts{Command_Line}) {
           if ($doc_count == $Opts{Max_Documents}) {
-            print("<hr />\n<p><strong>Maximum number of documents reached!</strong></p>\n");
+            print("<hr />\n<p><strong>Maximum number of documents ($Opts{Max_Documents}) reached!</strong></p>\n");
           }
           if ($doc_count >= $Opts{Max_Documents}) {
             $doc_count++;
@@ -1335,6 +1340,9 @@
 sub parse_document ($$$$$)
 {
   my ($uri, $base_uri, $response, $links, $rec_needs_links) = @_;
+
+  print("parse_document($uri, $base_uri, ..., $links, $rec_needs_links)\n")
+    if $Opts{Verbose};
 
   my $p;
 
Received on Thursday, 5 August 2010 14:47:26 UTC

This archive was generated by hypermail 2.3.1 : Wednesday, 7 January 2015 15:17:43 UTC