mirror of
https://git.notmuchmail.org/git/notmuch
synced 2024-11-27 05:07:56 +01:00
1e96445cb5
Setting the locale environment variables (LC_* and LANG) to e.g. en_US.utf8 works fine on Linux, and that is what `locale -a` returns there. However, this does not work on e.g. some *BSD systems, where en_US.UTF-8 works instead. The latter also works on Linux systems (which may look surprising at first sight(*)), and the *.UTF-8 form seems to be widely used on Linux anyway: grep for it through the files in /etc/, for example. An easy way to test is to run the following two command lines; the first should complain that setting the locale failed, and the second should not: $ LC_ALL=en_US.UTF-1 perl -e '' $ LC_ALL=en_US.UTF-8 perl -e '' (*) and who knows what the "standard" is...
205 lines
5 KiB
Perl
Executable file
205 lines
5 KiB
Perl
Executable file
#!/usr/bin/perl
|
|
#
|
|
# Author: Tomi Ollila
|
|
# License: same as notmuch
|
|
#
|
|
# This program is used to generate mdwn-formatted notmuch manual pages
|
|
# for notmuch wiki. Example run:
|
|
#
|
|
# $ ./devel/man-to-mdwn.pl doc/_build/man ../notmuch-wiki
|
|
#
|
|
# In case taken into more generic use, modify these comments and examples.
|
|
|
|
use 5.10.1;
|
|
use strict;
|
|
use warnings;
|
|
|
|
# Command-line validation: exactly two arguments are expected, a source
# directory and a destination directory.  Both must already exist, and the
# destination must already contain a 'manpages' subdirectory.
if (@ARGV != 2) {
    warn "\n$0 <source-directory> <destination-directory>\n\n";
    # Remove/edit this comment if this script is taken into generic use.
    warn "Example: ./devel/man-to-mdwn.pl doc/_build/man ../notmuch-wiki\n\n";
    exit 1;
}

-d $ARGV[0] or die "'$ARGV[0]': no such source directory\n";
-d $ARGV[1] or die "'$ARGV[1]': no such destination directory\n";

#die "'manpages' exists\n" if -e 'manpages';
#die "'manpages.mdwn' exists\n" if -e 'manpages.mdwn';

# The per-page output files go below <destination-directory>/manpages;
# refuse to continue when that directory is missing.
-d "$ARGV[1]/manpages"
    or die "Expecting '$ARGV[1]/manpages' to exist.\n",
           "Please create it first or adjust <destination-directory>.\n";
|
|
|
|
# Flag set to 1 when two source files map to the same output page name.
# NOTE(review): nothing in the visible part of this script reads $ev again.
my $ev = 0;

# Maps an output page name (file basename with every '.' replaced by '-',
# e.g. 'notmuch-1') to the path of the corresponding source manual page.
my %fhash;

# Collect every file below the source directory whose name ends in a dot
# followed by one digit.  The list form of open() runs find(1) without a
# shell, so the glob pattern reaches find unexpanded.
open my $find_fh, '-|', 'find', $ARGV[0], qw/-name *.[0-9] -print/
    or die "Cannot run 'find' on '$ARGV[0]': $!\n";

while (my $in = <$find_fh>) {
    chomp $in;
    next unless -f $in;    # -f follows symlinks; anything else is skipped.

    # Page name: strip the directory part, then turn dots into dashes.
    (my $on = $in) =~ s|.*/||;
    $on =~ tr/./-/;

    # A later file with the same page name replaces the earlier one, but
    # the collision is reported.
    if (defined(my $f = $fhash{$on})) {
        $ev = 1;
        warn "'$in' collides with '$f' ($on.mdwn)\n";
    }
    $fhash{$on} = $in;
}

# close() on a pipe returns false when the child exited with a non-zero
# status ($! is then 0 and the status is in $?).  Report it, but keep going
# with whatever find managed to list.
close $find_fh
    or warn $! ? "Error closing pipe from 'find': $!\n"
               : "'find' exited with status " . ($? >> 8) . "\n";
|
|
|
|
# Characters that are special in HTML, mapped to the entity replacing them.
my %htmlqh = (
    '&' => '&amp;',
    '<' => '&lt;',
    '>' => '&gt;',
    "'" => '&apos;',
    '"' => '&quot;',
);

# Do HTML quotation to $_[0] in place ($_[0] is an alias to the given
# argument, so the caller's variable is modified directly).  The ($)
# prototype lets callers write 'htmlquote $_;' without parentheses.
sub htmlquote($)
{
    $_[0] =~ s/([&<>'"])/$htmlqh{$1}/g;
}

# Forward declarations: these subs are defined further down but are called
# before that point, partly without parentheses, so their prototypes have
# to be known in advance.
sub maymakelink($);
sub mayconvert($$);
|
|
|
|
#warn keys %fhash, "\n";
|
|
|
|
# Convert every collected manual page into
# <destination-directory>/manpages/<page-name>.mdwn.
while (my ($k, $v) = each %fhash)
{
    #next if -l $v; # skip symlinks here. -- not... references there may be.

    # Pass 1: format the page with man(1) in a minimal, fixed environment
    # and turn its overstrike (backspace) output into marked-up lines.
    my @lines;
    open my $man_fh, '-|', qw/env -i/, "PATH=$ENV{PATH}",
        qw/TERM=vt100 LANG=en_US.UTF-8 LC_ALL=en_US.UTF-8/,
        qw/GROFF_NO_SGR=1 MAN_KEEP_FORMATTING=1 MANWIDTH=80/,
        qw/man/, $v
        or die "Cannot run 'man' on '$v': $!\n";
    binmode $man_fh, ':utf8';

    # $emptyline: a blank line was seen and not yet emitted.
    # $pre:       a <pre> block is currently open.
    # $hl:        tag for the next unindented line (first is h1, rest h2).
    my ($emptyline, $pre, $hl) = (0, 0, 'h1');
    while (<$man_fh>) {
        if (/^\s*$/) {
            $emptyline = 1;
            next;
        }
        # keep only leftmost in lines like 'NOTMUCH(1) notmuch NOTMUCH(1)'
        s/\S\K\s{8,}\S.+\s{8,}\S.*//; # $hl = 'h1' if s/(?<=\S)\s{8,}.*//;
        s/[_&]\010&/&/g;                              # overstruck '&'
        # \001 and \002 stand in for '<' and '>' of generated tags so that
        # the HTML quoting below does not touch them.
        s/((?:_\010[^_])+)/\001u\002$1\001\/u\002/g;  # underlined runs
        s/_\010(.)/$1/g;
        s/((?:.\010.)+)/\001b\002$1\001\/b\002/g;     # bold runs
        s/.\010(.)/$1/g;
        htmlquote($_);
        s/\001/</g;
        s/\002/>/g;

        if (/^\S/) {
            # Unindented line: a heading.
            if ($pre) {
                $pre = 0;
                push @lines, "</pre>\n";
            }
            s/<\/?b>//g;
            chomp;
            $_ = "\n<$hl>$_</$hl>\n";
            $hl = 'h2';
            $emptyline = 0;
        }
        elsif (/^\s\s\s\S/) {
            # Line indented by exactly three whitespace characters: a
            # sub-heading.
            if ($pre) {
                $pre = 0;
                push @lines, "</pre>\n";
            }
            s/(?:^\s+)?<\/?b>//g;
            chomp;
            $_ = "\n<h3> $_</h3>\n";
            $emptyline = 0;
        }
        else {
            # Anything else is body text, kept inside <pre>.  A pending
            # blank line is reproduced only here.
            unless ($pre) {
                $pre = 1;
                push @lines, "<pre>\n";
            }
            if ($emptyline) {
                $emptyline = 0;
                push @lines, "\n";
            }
        }
        push @lines, $_;
    }
    # close() on a pipe is false when the child exited with non-zero status
    # ($! is then 0); report it instead of silently writing a bad page.
    close $man_fh
        or warn $! ? "Error closing pipe from 'man' for '$v': $!\n"
                   : "'man' exited with status " . ($? >> 8) . " for '$v'\n";

    # Drop the newline in front of the very first heading.  Guarded so that
    # an empty man output does not touch an undefined element.
    $lines[0] =~ s/^\n// if @lines;

    # Pass 2: write the page, turning bold 'name(section)' references into
    # links where a page of that name was collected.
    my $outfile = "$ARGV[1]/manpages/$k.mdwn";
    open my $out_fh, '>', $outfile or die "Cannot write '$outfile': $!\n";
    binmode $out_fh, ':utf8';
    print STDOUT 'Writing ', "'$outfile'\n";

    # $pe holds a bold word whose trailing hyphen ended the previous line
    # (a reference possibly split over two lines); $hyphen is the hyphen
    # character that was removed together with it.
    my ($pe, $hyphen) = ('', '');
    foreach (@lines) {
        #print $_; next;
        if ($pe) {
            if (s/^(\s+)<b>([^<]+)\((\d+)\)<\/b>//) {
                my ($indent, $name, $section) = ($1, $2, $3);
                # Try the name with the hyphen kept first, then with the
                # hyphen treated as a pure line-break hyphen.
                my $link = maymakelink("$pe-$name-$section")
                        || maymakelink("$pe$name-$section");
                if ($link) {
                    print {$out_fh} "<a href='$link'>$pe$hyphen</a>\n";
                    print {$out_fh} "$indent<a href='$link'>$name</a>($section)";
                }
                else {
                    # Put back exactly the hyphen character that was cut.
                    print {$out_fh} "<b>$pe$hyphen</b>\n";
                    print {$out_fh} "$indent<b>$name</b>($section)";
                }
            }
            else {
                print {$out_fh} "<b>$pe$hyphen</b>\n";
            }
            $pe = '';
        }
        s/<b>([^<]+)\((\d+)\)<\/b>/mayconvert($1, $2)/ge;
        ($pe, $hyphen) = ($1, $2) if s/<b>([^<]+)([-\x{2010}])<\/b>\s*$//;
        print {$out_fh} $_;
    }
    # Buffered write errors surface at close time.
    close $out_fh or die "Error writing '$outfile': $!\n";
}
|
|
|
|
# Return the relative link '../<page>/' when <page> (the only argument) is
# a key of %fhash, i.e. one of the collected pages; otherwise return ''.
sub maymakelink($)
{
    my ($page) = @_;
    # warn "$page\n";
    return exists $fhash{$page} ? "../$page/" : '';
}
|
|
|
|
# Render a 'name(section)' reference.  Arguments: the name and the section.
# When '<name>-<section>' is a key of %fhash the name becomes a link to
# that page, otherwise it is kept as bold text.
sub mayconvert($$)
{
    my ($name, $section) = @_;
    my $page = join '-', $name, $section;
    # warn "$page\n";
    exists $fhash{$page}
        or return "<b>$name</b>($section)";
    return "<a href='../$page/'>$name</a>($section)";
}
|
|
|
|
# Finally, make manpages.mdwn: an index with one list entry per collected
# page, followed by a license note.

my $index_file = $ARGV[1] . '/manpages.mdwn';
open my $index_fh, '>', $index_file
    or die "Cannot write '$index_file': $!\n";
print STDOUT "Writing '$ARGV[1]/manpages.mdwn'\n";
print {$index_fh} "Manual page index\n";
print {$index_fh} "=================\n\n";

# Sort comparator: compare source paths as strings after replacing every
# '.' with '-'.
sub srt { my ($x, $y) = ($a, $b); $x =~ tr/./-/; $y =~ tr/./-/; $x cmp $y; }

foreach my $in (sort srt values %fhash)
{
    # The index entry is built from the page source itself, not from the
    # formatted output.
    open my $page_fh, '<', $in or die "Cannot read '$in': $!\n";

    # Section: second argument of the .TH request, optionally quoted.
    my $s;
    while (my $row = <$page_fh>) {
        if ($row =~ /^\s*[.]TH\s+\S+\s+"?(\S+?)"?\s/) {
            $s = $1;
            last;
        }
    }

    # Skip forward to the NAME section.
    while (my $row = <$page_fh>) {
        last if $row =~ /^\s*[.]SH NAME/;
    }

    # The first following line with a word followed by whitespace provides
    # the description: everything after that first word, with all
    # backslashes removed.
    my $line = '';
    while (my $row = <$page_fh>) {
        $row =~ tr/\\//d;
        if ($row =~ /\s*(\S+)\s+(.*)/) {
            my $e = $2;
            # Ignoring the NAME in file, get from file name instead.
            #my $on = (-l $in)? readlink $in: $in;
            # $on: page name (basename, dots turned into dashes).
            (my $on = $in) =~ tr/./-/;
            $on =~ s|.*/||;
            # $n: page name without its trailing '-<section>' part.
            (my $n = $on) =~ s/-[^-]+$//;
            $line = "<a href='$on/'>$n</a>($s) $e\n";
            last;
        }
    }
    close $page_fh;

    die "No NAME in '$in'\n" unless $line;
    print {$index_fh} "* $line";
    #warn $line;
}

print {$index_fh} <<'EOF';

The manual pages are licensed under
[the GNU General Public License](https://www.gnu.org/licenses/gpl.txt),
either version 3.0 or at your option any later version.
EOF

# Buffered write errors surface at close time.
close $index_fh or die "Error writing '$index_file': $!\n";
|