|
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

[Xen-devel] [PATCH 4/7] docs/gen-html-index: Extract titles from HTML documents
Signed-off-by: Ian Jackson <Ian.Jackson@xxxxxxxxxxxxx>
---
docs/gen-html-index | 13 +++++++++++++
1 file changed, 13 insertions(+)
diff --git a/docs/gen-html-index b/docs/gen-html-index
index e9792bf..5b43b42 100644
--- a/docs/gen-html-index
+++ b/docs/gen-html-index
@@ -10,6 +10,7 @@ use warnings;
use Getopt::Long;
use IO::File;
use File::Basename;
+use HTML::TreeBuilder::XPath;
Getopt::Long::Configure('bundling');
@@ -64,6 +65,18 @@ sub make_linktext ($) {
return "$1($2)" if $l =~ m,^man/(.*)\.([0-9].*)\.html,;
$l =~ s/.(?:html|txt)$//g;
return $index{$l} if exists $index{$l};
+
+ my $from_html;
+ eval {
+ my $tree = new HTML::TreeBuilder::XPath;
+ my $f = "$outdir/$l.html";
+ open F, '<', $f or die "$l $f $!";
+ $tree->parse_file(\*F) or die;
+ close F;
+ $from_html = $tree->findvalue("/html/head/title");
+ };
+ return $from_html if $from_html;
+
return basename($l);
}
--
2.1.4
_______________________________________________
Xen-devel mailing list
Xen-devel@xxxxxxxxxxxxxxxxxxxx
https://lists.xenproject.org/mailman/listinfo/xen-devel
|
Lists.xenproject.org is hosted with RackSpace, monitoring our [...]