527 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Perl
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			527 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Perl
		
	
	
		
			Executable File
		
	
	
	
	
#!/usr/bin/env perl
 | 
						|
#***************************************************************************
 | 
						|
#                                  _   _ ____  _
 | 
						|
#  Project                     ___| | | |  _ \| |
 | 
						|
#                             / __| | | | |_) | |
 | 
						|
#                            | (__| |_| |  _ <| |___
 | 
						|
#                             \___|\___/|_| \_\_____|
 | 
						|
#
 | 
						|
# Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.
 | 
						|
#
 | 
						|
# This software is licensed as described in the file COPYING, which
 | 
						|
# you should have received as part of this distribution. The terms
 | 
						|
# are also available at https://curl.se/docs/copyright.html.
 | 
						|
#
 | 
						|
# You may opt to use, copy, modify, merge, publish, distribute and/or sell
 | 
						|
# copies of the Software, and permit persons to whom the Software is
 | 
						|
# furnished to do so, under the terms of the COPYING file.
 | 
						|
#
 | 
						|
# This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 | 
						|
# KIND, either express or implied.
 | 
						|
#
 | 
						|
# SPDX-License-Identifier: curl
 | 
						|
#
 | 
						|
###########################################################################
 | 
						|
 | 
						|
=begin comment
 | 
						|
 | 
						|
Converts a curldown file to nroff (man page).
 | 
						|
 | 
						|
=end comment
 | 
						|
=cut
 | 
						|
 | 
						|
use strict;
 | 
						|
use warnings;
 | 
						|
 | 
						|
my $cd2nroff = "0.1"; # to keep check
my $dir;          # set by -d: directory to write the generated file into
my $extension;    # set by -e: text appended to the output file name
my $keepfilename; # set by -k: name the output after the input file

# Consume leading options from @ARGV. The loop stops at the first argument
# that is not a recognized option; everything left in @ARGV afterwards is
# treated as an input file name by the code at the end of the script.
while(@ARGV) {
    if($ARGV[0] eq "-d") {
        shift @ARGV;
        $dir = shift @ARGV;
    }
    elsif($ARGV[0] eq "-e") {
        shift @ARGV;
        $extension = shift @ARGV;
    }
    elsif($ARGV[0] eq "-k") {
        shift @ARGV;
        $keepfilename = 1;
    }
    elsif($ARGV[0] eq "-h") {
        # -k is implemented above, so it is listed here as well
        print <<HELP;
Usage: cd2nroff [options] [file.md]

-d <dir> Write the output to the file name from the meta-data in the
         specified directory, instead of writing to stdout
-e <ext> If -d is used, this option can provide an added "extension", arbitrary
         text really, to append to the file name.
-h       This help text,
-k       If -d is used, name the output after the input file name (minus its
         extension) instead of the title from the meta-data
-v       Show version then exit
HELP
        exit 0;
    }
    elsif($ARGV[0] eq "-v") {
        print "cd2nroff version $cd2nroff\n";
        exit 0;
    }
    else {
        last;
    }
}
 | 
						|
 | 
						|
use POSIX qw(strftime);
 | 
						|
# Date stamp used in the generated .TH line. When SOURCE_DATE_EPOCH is set in
# the environment that timestamp is used (as UTC), otherwise the current
# local time.
my @ts = defined($ENV{SOURCE_DATE_EPOCH}) ?
    gmtime($ENV{SOURCE_DATE_EPOCH}) : localtime();
my $date = strftime("%Y-%m-%d", @ts);
 | 
						|
 | 
						|
# Build the "SEE ALSO" section.
#
# Takes the list of see-also entries and returns a list of nroff fragments:
# the .SH header, one ".BR <entry>" per entry in sorted order (every entry
# after the first is preceded by ",\n") and a final newline.
sub outseealso {
    my (@sa) = @_;
    my $comma = 0;
    my @o;
    push @o, ".SH SEE ALSO\n";
    for my $s (sort @sa) {
        # The entry is appended as plain data, never used as part of a
        # format string, so a '%' in it is output verbatim.
        push @o, ($comma ? ",\n" : "") . ".BR $s";
        $comma = 1;
    }
    push @o, "\n";
    return @o;
}
 | 
						|
 | 
						|
# Build the "PROTOCOLS" section.
#
# Takes the list of protocol names and returns a list of nroff fragments: the
# .SH header, the body text and a final newline. When the first entry is
# "TLS" a fixed sentence is emitted, otherwise the sorted names are written
# as "A, B and C". An empty list yields just the header and the newline.
sub outprotocols {
    my (@p) = @_;
    my @o;
    push @o, ".SH PROTOCOLS\n";

    # check for elements first so an empty list is not compared as undef
    if(@p && ($p[0] eq "TLS")) {
        push @o, "All TLS based protocols: HTTPS, FTPS, IMAPS, POP3S, SMTPS etc.";
    }
    else {
        my @s = sort @p;
        for my $i (0 .. $#s) {
            # The separator is chosen by position, not by comparing names,
            # so only the final element is joined with " and ".
            my $sep = "";
            if($i) {
                $sep = ($i == $#s) ? " and " : ", ";
            }
            push @o, $sep . $s[$i];
        }
    }
    push @o, "\n";
    return @o;
}
 | 
						|
 | 
						|
# Build the paragraph describing which TLS backends support an option.
#
# Takes the list of TLS backend names and returns a list of nroff fragments.
# When the first entry is "All" a fixed sentence is emitted, otherwise an
# introduction line followed by the sorted names written as "A, B and C".
# The returned list always ends with a newline fragment.
sub outtls {
    my (@t) = @_;
    my @o;
    # check for elements first so an empty list is not compared as undef
    if(@t && ($t[0] eq "All")) {
        push @o, "\nAll TLS backends support this option.";
    }
    else {
        push @o, "\nThis option works only with the following TLS backends:\n";
        my @s = sort @t;
        for my $i (0 .. $#s) {
            # The separator is chosen by position and the name is appended
            # as plain data rather than being part of a format string.
            my $sep = "";
            if($i) {
                $sep = ($i == $#s) ? " and " : ", ";
            }
            push @o, $sep . $s[$i];
        }
    }
    push @o, "\n";
    return @o;
}
 | 
						|
 | 
						|
# Names accepted in the "Protocol:" list of a section 3 page header. Every
# listed name maps to a true value so membership is a plain hash lookup.
my %knownprotos = map { ($_ => 1) } qw(
    DICT FILE FTP FTPS GOPHER GOPHERS
    HTTP HTTPS IMAP IMAPS LDAP LDAPS
    MQTT POP3 POP3S RTMP RTMPS RTSP
    SCP SFTP SMB SMBS SMTP SMTPS
    TELNET TFTP WS WSS
    TLS TCP All
);
 | 
						|
 | 
						|
# Names accepted in the "TLS-backend:" list of a page header. Every listed
# name maps to a true value so membership is a plain hash lookup.
my %knowntls = map { ($_ => 1) } (
    "BearSSL",
    "GnuTLS",
    "mbedTLS",
    "OpenSSL",
    "rustls",
    "Schannel",
    "Secure Transport",
    "wolfSSL",
    "All",
);
 | 
						|
 | 
						|
# Convert a single curldown document to nroff.
#
# $f is the name of the file to convert. When it is undefined the document
# is read from STDIN instead.
#
# The document starts with a header enclosed in "---" lines holding the
# meta-data (Title, Section, Source, See-also, Protocol, TLS-backend, C and
# SPDX-License-Identifier), followed by the markdown-like body.
#
# The generated page is written to "$dir/<title>.<section>[$extension]" when
# the file-level $dir is set, otherwise to stdout. Diagnostics go to STDERR.
#
# Returns 0 on success. A fatal problem returns 1 or 2 and produces no
# output. Otherwise the return value is the number of "2 spaces detected"
# errors found in the body (the output is still written in that case). The
# caller uses the value as the process exit code.
sub single {
    my ($f) = @_;
    my @seealso;
    my @proto;
    my @tls;
    my $copyright;
    my $errors = 0;
    my $fh;
    my $opened = 0;     # true when $fh was opened here and must be closed
    my $line = 0;       # current input line number, for diagnostics
    my $list = 0;       # header list being filled: 0 none, 1 see-also,
                        # 2 protocol, 3 TLS backend
    my $section;
    my $source;
    my $spdx;
    my $start = 0;      # set once the opening "---" has been seen
    my $headerdone = 0; # set once the closing "---" has been seen
    my $title;

    if(defined($f)) {
        if(!open($fh, "<:crlf", $f)) {
            print STDERR "cd2nroff failed to open '$f' for reading: $!\n";
            return 1;
        }
        $opened = 1;
    }
    else {
        $f = "STDIN";
        $fh = \*STDIN;
        binmode($fh, ":crlf");
    }

    # first pass: the header
    while(<$fh>) {
        $line++;
        if(!$start) {
            if(/^---/) {
                # header starts here
                $start = 1;
            }
            next;
        }
        if(/^Title: *(.*)/i) {
            $title=$1;
        }
        elsif(/^Section: *(.*)/i) {
            $section=$1;
        }
        elsif(/^Source: *(.*)/i) {
            $source=$1;
        }
        elsif(/^See-also: +(.*)/i) {
            $list = 1; # 1 for see-also
            push @seealso, $1;
        }
        elsif(/^See-also: */i) {
            if($seealso[0]) {
                print STDERR "$f:$line:1:ERROR: bad See-Also, needs list\n";
                return 2;
            }
            $list = 1; # 1 for see-also
        }
        elsif(/^Protocol:/i) {
            $list = 2; # 2 for protocol
        }
        elsif(/^TLS-backend:/i) {
            $list = 3; # 3 for TLS backend
        }
        elsif(/^ +- (.*)/i) {
            # the only lists we support are see-also, protocol and
            # TLS backend
            if($list == 1) {
                push @seealso, $1;
            }
            elsif($list == 2) {
                push @proto, $1;
            }
            elsif($list == 3) {
                push @tls, $1;
            }
            else {
                print STDERR "$f:$line:1:ERROR: list item without owner?\n";
                return 2;
            }
        }
        # REUSE-IgnoreStart
        elsif(/^C: (.*)/i) {
            $copyright=$1;
        }
        elsif(/^SPDX-License-Identifier: (.*)/i) {
            $spdx=$1;
        }
        # REUSE-IgnoreEnd
        elsif(/^---/) {
            # end of the header section
            if(!$title) {
                print STDERR "ERROR: no 'Title:' in $f\n";
                return 1;
            }
            if(!$section) {
                print STDERR "ERROR: no 'Section:' in $f\n";
                return 2;
            }
            if(!$seealso[0]) {
                print STDERR "$f:$line:1:ERROR: no 'See-also:' present\n";
                return 2;
            }
            if(!$copyright) {
                print STDERR "$f:$line:1:ERROR: no 'C:' field present\n";
                return 2;
            }
            if(!$spdx) {
                print STDERR "$f:$line:1:ERROR: no 'SPDX-License-Identifier:' field present\n";
                return 2;
            }
            if($section == 3) {
                # Section 3 pages must list valid protocols. Failures are
                # returned like every other header error (the caller exits
                # with the returned code) and printed with print, so that a
                # '%' in the file name is not taken as a format directive.
                if(!$proto[0]) {
                    print STDERR "$f:$line:1:ERROR: missing Protocol:\n";
                    return 2;
                }
                my $tls = 0;
                for my $p (@proto) {
                    if($p eq "TLS") {
                        $tls = 1;
                    }
                    if(!$knownprotos{$p}) {
                        print STDERR "$f:$line:1:ERROR: invalid protocol used: $p:\n";
                        return 2;
                    }
                }
                # This is for TLS, require TLS-backend:
                if($tls) {
                    if(!$tls[0]) {
                        print STDERR "$f:$line:1:ERROR: missing TLS-backend:\n";
                        return 2;
                    }
                    for my $t (@tls) {
                        if(!$knowntls{$t}) {
                            print STDERR "$f:$line:1:ERROR: invalid TLS backend: $t:\n";
                            return 2;
                        }
                    }
                }
            }
            $headerdone = 1;
            last;
        }
        else {
            chomp;
            print STDERR "WARN: unrecognized line in $f, ignoring:\n:'$_'\n";
        }
    }

    if(!$start) {
        print STDERR "$f:$line:1:ERROR: no header present\n";
        return 2;
    }
    if(!$headerdone) {
        # input ended before the closing "---"; none of the mandatory
        # fields have been verified so nothing sensible can be generated
        print STDERR "$f:$line:1:ERROR: header not terminated\n";
        return 2;
    }

    my @desc;
    my $quote = 0;     # 0: normal text, 1: inside ~~~ block,
                       # 4: inside a 4-space indented block
    my $blankline = 0; # blank lines seen since the last text line
    my $header = 0;    # set when the previous output was a .SH/.IP header

    # cut off the leading path from the file name, if any
    $f =~ s/^(.*[\\\/])//;

    # 'Source:' is optional, avoid interpolating an undefined value
    my $src = defined($source) ? $source : "";

    push @desc, ".\\\" generated by cd2nroff $cd2nroff from $f\n";
    push @desc, ".TH $title $section \"$date\" $src\n";

    # second pass: the body
    while(<$fh>) {
        $line++;

        my $d = $_;

        if($quote == 4) {
            # remove the indentation
            if($d =~ /^    (.*)/) {
                # NOTE(review): unlike ~~~ blocks, these lines get no
                # backslash or leading-period escaping
                push @desc, "$1\n";
                next;
            }
            # end of quote
            $quote = 0;
            push @desc, ".fi\n";
            # A blank line only terminates the quote. Any other line is
            # content and falls through to the regular handling below
            # instead of being dropped.
            next if($d =~ /^\s*$/);
        }
        elsif($quote) {
            if(/^~~~/) {
                # end of quote
                $quote = 0;
                push @desc, ".fi\n";
                next;
            }
            # convert single backslashes to doubles
            $d =~ s/\\/\\\\/g;
            # lines starting with a period needs it escaped
            $d =~ s/^\./\\&./;
            push @desc, $d;
            next;
        }

        # remove single line HTML comments
        $d =~ s/<!--.*?-->//g;

        # **bold**
        $d =~ s/\*\*(\S.*?)\*\*/\\fB$1\\fP/g;
        # *italics*
        $d =~ s/\*(\S.*?)\*/\\fI$1\\fP/g;

        if($d =~ /[^\\][\<\>]/) {
            print STDERR "$f:$line:1:WARN: un-escaped < or > used\n";
        }
        # convert backslash-'<' or '> to just the second character
        $d =~ s/\\([<>])/$1/g;

        # mentions of curl symbols with man pages use italics by default
        $d =~ s/((lib|)curl([^ ]*\(3\)))/\\fI$1\\fP/gi;

        # backticked becomes italics
        $d =~ s/\`(.*?)\`/\\fI$1\\fP/g;

        # The structural checks below look at the unmodified input line in
        # $_, the inline markup conversions above only affect $d.
        if(/^## (.*)/) {
            my $word = $1;
            # if there are enclosing quotes, remove them first
            $word =~ s/[\"\'\`](.*)[\"\'\`]\z/$1/;

            # enclose in double quotes if there is a space present
            if($word =~ / /) {
                push @desc, ".IP \"$word\"\n";
            }
            else {
                push @desc, ".IP $word\n";
            }
            $header = 1;
        }
        elsif(/^# (.*)/) {
            my $word = $1;
            # if there are enclosing quotes, remove them first
            $word =~ s/[\"\'](.*)[\"\']\z/$1/;

            if($word eq "PROTOCOLS") {
                print STDERR "$f:$line:1:WARN: PROTOCOLS section in source file\n";
            }
            elsif($word eq "EXAMPLE") {
                # insert the generated PROTOCOLS section before EXAMPLE
                push @desc, outprotocols(@proto);

                # @proto may be empty for pages outside section 3
                if(@proto && ($proto[0] eq "TLS")) {
                    push @desc, outtls(@tls);
                }
            }
            push @desc, ".SH $word\n";
            $header = 1;
        }
        elsif(/^~~~c/) {
            # start of a code section, not indented
            $quote = 1;
            push @desc, "\n" if($blankline && !$header);
            $header = 0;
            push @desc, ".nf\n";
        }
        elsif(/^~~~/) {
            # start of a quote section; not code, not indented
            $quote = 1;
            push @desc, "\n" if($blankline && !$header);
            $header = 0;
            push @desc, ".nf\n";
        }
        elsif(/^    (.*)/) {
            # quoted, indented by 4 space
            $quote = 4;
            push @desc, "\n" if($blankline && !$header);
            $header = 0;
            push @desc, ".nf\n$1\n";
        }
        elsif(/^[ \t]*\n/) {
            # count and ignore blank lines
            $blankline++;
        }
        else {
            # don't output newlines if this is the first content after a
            # header
            push @desc, "\n" if($blankline && !$header);
            $blankline = 0;
            $header = 0;

            # quote minuses in the output
            $d =~ s/([^\\])-/$1\\-/g;
            # replace single quotes
            $d =~ s/\'/\\(aq/g;
            # handle double quotes first on the line
            $d =~ s/^(\s*)\"/$1\\&\"/;

            # lines starting with a period needs it escaped
            $d =~ s/^\./\\&./;

            if($d =~ /^(.*)  /) {
                printf STDERR "$f:$line:%d:ERROR: 2 spaces detected\n",
                    length($1);
                $errors++;
            }
            if($d =~ /^[ \t]*\n/) {
                # replaced away all contents
                $blankline= 1;
            }
            else {
                push @desc, $d;
            }
        }
    }
    if($opened) {
        close($fh);
    }
    push @desc, outseealso(@seealso);
    if($dir) {
        if($keepfilename) {
            # name the output after the input file, minus its extension
            $title = $f;
            $title =~ s/\.[^.]*$//;
        }
        my $outfile = "$dir/$title.$section";
        if(defined($extension)) {
            $outfile .= $extension;
        }
        my $out;
        if(!open($out, ">", $outfile)) {
            print STDERR "Failed to open $outfile : $!\n";
            return 1;
        }
        print $out @desc;
        # buffered write errors surface when the handle is closed
        if(!close($out)) {
            print STDERR "Failed to write $outfile : $!\n";
            return 1;
        }
    }
    else {
        print @desc;
    }
    return $errors;
}
 | 
						|
 | 
						|
# Entry point. Without any file name left on the command line a single
# document is converted from stdin and its result becomes the exit code.
# Otherwise every named file is converted in order, stopping with the result
# as exit code at the first one that returns non-zero.
if(!@ARGV) {
    exit single();
}
foreach my $file (@ARGV) {
    my $status = single($file);
    exit $status if($status);
}
 |