]> www.wagner.pp.ru Git - fiction/Kate-the-Empress.git/blobdiff - Tex2fb2
Merge branch 'master' of https://www.wagner.pp.ru/git/fiction/Kate-the-Empress
[fiction/Kate-the-Empress.git] / Tex2fb2
diff --git a/Tex2fb2 b/Tex2fb2
index 693149fcdc401644ad80bda7cf08af16a61a47eb..96279b391b0062e4b4afdb8b8e21ceddb3366ecd 100755 (executable)
--- a/Tex2fb2
+++ b/Tex2fb2
@@ -1,26 +1,50 @@
 #!/usr/bin/perl -CDS
 use utf8;
+use POSIX qw(strftime);
+use MIME::Base64;
 # char-level modes
 my $poetry = 0;
 my $verbatim = 0;
 my @sections;
 my $buffer;
+my $idseq = 0; # sequential number of footnotes
+my $footnotes="";
 #
 # TODO italic paragaphs
 # footnotes
 # epigraphs
 #
 # print fictionbook header
-print "<?xml version=\"1.0\" encoding=\"UTF-8\">\n";
+print "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n";
 print "<FictionBook xmlns=\"http://www.gribuser.ru/xml/fictionbook/2.0\"
 xmlns:l=\"http://www.w3.org/1999/xlink\">\n";
 my $metadata = shift @ARGV;
 open F,"<",$metadata;
+my $pics = "";
 while (<F>) {
+       # Replace empty date with current date
+       if (/<date\s+\/>/ || /<date>\s*<\/date>/) {
+               $_ = "<date value=\"".strftime("%Y-%m-%d",localtime())."\">".
+                       strftime("%d/%m/%Y",localtime())."</date>\n";
+       }
+       # Add the current time as a fractional part to the version
+       if (/<version>(\d*)(.\d*)?<\/version>/) {
+               my $ver = $1+time()/1E10;
+               $_=tag(sprintf("%g",$ver),"version")."\n";
+       }
+       # If cover.png exists, add a coverpage
+       if (/<coverpage \/>/) {
+               $_="";
+               if (-f "cover.png") { 
+                       my $id = "cover_png";
+                       $_ = "<coverpage>\n<image l:href=\"#$id\" />\n</coverpage>\n";
+                       $pics .= mkbinary("cover.png",$id);
+               }
+       }
        print $_;
 }
 close F;
-
+print "<body>\n";
 my $header =1;
 LINE:
 while (<>) {
@@ -46,17 +70,17 @@ if (/\\(begin|end){(\w+)}/) {
 next LINE if $header;
 if ((/^$/ || $environ) && $buffer) {
 #output on empty line (p or stanza) depending on poetry mode
-       add_to_section(tag($buffer,$poetry?"stanza":"p")."\n");
+       add_to_section(tag(flushbuffer($buffer),$poetry?"stanza":"p")."\n");
        $buffer="";
 }
 next LINE if $environ;
 # Section headings
 if (/\\(part|chapter|section|subsection|subsubsection)\*?{(.*)}/) {
        if ($buffer) {
-               add_to_section(tag($buffer,$poetry?"stanza":"p"));
+               add_to_section(tag(flushbuffer($buffer),$poetry?"stanza":"p"));
                $buffer="";
        }
-       pushsection($1,$2);
+       pushsection($1,tag($2,"p"));
        next LINE;
 }
 if (/\\vspace{/) {
@@ -64,6 +88,12 @@ if (/\\vspace{/) {
        next LINE;
 }
 next LINE if /\\pagebreak\b/;
+#escape XML special characters (& ' " < >) as entities
+s/&/&amp;/g;
+s/'/&apos;/g;
+s/"/&quot;/g;
+s/</&lt;/g;
+s/>/&gt;/g;
 #normal mode: 
 if (!$verbatim) {
 #strip TeX comments 
@@ -79,21 +109,26 @@ s/\s+$//;
 s/(\s)\s+/$1/g;
 #replace TeX ligatures ~ --- << >> \% with appropriate unicode symbols
 s/~/\xA0/g;
-s/---/-/g;
+s/\\-/\xAD/g;
+s/---/—/g;
 s/<</«/g;
 s/>>/»/g;
 s/\\%/%/g;
 s/\\dots/\x{2026}/g;
+s/\\verb(.)(.*)\1/<code>$2<\/code>/;
 }
-#replace ' and " with entities
-s/&/&amp;/g;
-s/'/&apos;/g;
-s/"/&quot;/g;
-s/</&lt;/g;
-s/>/&gt;/g;
 
 if ($poetry) {
        chomp;
+       if ($poetic_buffer) {
+               $_ = $poetic_buffer." ".$_;
+               $poetic_buffer = undef;
+       }
+       if (/{[^}]+$/) {
+               $poetic_buffer=$_;
+               next LINE;
+       }
+       s/\\footnote{(.*)}/push_footnote($1)/e;
        s/\s*\\\\$//;
   $buffer.=tag($_,'v')."\n";
 } elsif ($verbatim) {
@@ -103,7 +138,7 @@ if ($poetry) {
 }
 }
 if ($buffer) {
-       add_to_section(tag($buffer,"p"));
+       add_to_section(tag(flushbuffer($buffer),"p"));
        $buffer="";
 }
 
@@ -111,12 +146,17 @@ while (@sections) {
        flushsection();
 }
 print "</body>\n";
-## FIXME print footnotes
+## print footnotes
+print "<body>\n$footnotes\n</body>" if $footnotes;
+print $pics;
 print "</FictionBook>";
 
 sub add_to_section {
        my $data = shift;
        return if ($#sections<0) ;
+       if ($data =~ /^\s*<section>/ && $sections[$#sections]->{data} !~ /^\s*<section>/) { # appending a <section> to data that does not already start with one
+               $sections[$#sections]->{data} = tag($sections[$#sections]->{data},"section")."\n"; # wrap what is already there in its own <section> first; presumably so loose paragraphs and subsections are not mixed -- confirm against the FB2 schema
+       }       
        $sections[$#sections]->{data}.=$data;
 }
 
@@ -127,7 +167,11 @@ sub flushsection {
        if ($str->{title}) {
                $content = tag($str->{title},"title");
        }
-       $content .=  $str->{data};
+       if ($str->{data} =~ /^\s*$/s) {
+               $content .= "<p>\n</p>";
+       } else {
+               $content .=  $str->{data};
+       }
        if ($#sections >=0) {
                add_to_section(tag($content,$tag)."\n");
        } else {
@@ -155,6 +199,34 @@ sub pushsection {
 
 sub tag {
        my ($content,$name) = @_;
-       return "" if $content =~ /^\s*$/s;
+       $content =~s/^\s+//s;
+       return "" unless $content;
        return "<$name>$content</$name>";
 }
+
+sub flushbuffer { # convert TeX inline markup in one paragraph buffer to FB2 inline elements; returns the converted text
+       local $_ = shift;
+       s/\{\\(em|it|bf)(?:\s+|\{\})([^{}]+)\}/<emphasis>$2<\/emphasis>/g; # {\em text} form
+       s/\\(emph|textit|textbf)\{([^{}]+)\}/<emphasis>$2<\/emphasis>/g; # \emph{text} form
+       s/\\footnote(\{((?:[^{}]++|(?1))*)\})/push_footnote($2)/ge; # every footnote, each ending at its own balanced closing brace
+       s/[{}]//g; # drop whatever TeX grouping braces remain
+       return $_;
+}
+
+
+sub push_footnote { # append one footnote body to $footnotes; returns the inline link that points at it
+       my $id = "note_" . ++$idseq;
+       $footnotes .= join "", qq{<section id="$id">}, tag($_[0], 'p'), "</section>\n";
+       return qq{<a l:href="#$id" type="note">$idseq</a>};
+}
+
+sub mkbinary { # returns an FB2 <binary> element with the base64-encoded bytes of $filename under id $id; dies if the file cannot be opened
+       my ($filename,$id) = @_;
+       # Fail loudly: an unreadable file would otherwise produce an empty <binary>.
+       open my $f,"<",$filename or die "Cannot open $filename: $!\n";
+       binmode $f; # read raw bytes; the -CD switch on the shebang line makes UTF-8 the default layer
+       local $/; # slurp mode: the next read returns the whole file
+       my $data = encode_base64(<$f>);
+       close $f; # release the handle before returning
+       return "<binary id=\"$id\" content-type=\"image/png\">$data</binary>\n";
+}