! (c)2010 Joe Groff bsd license USING: accessors arrays assocs calendar calendar.format combinators combinators.short-circuit fry io io.directories io.encodings.binary io.encodings.detect io.encodings.utf8 io.files io.files.info io.files.types io.pathnames kernel locals math math.parser sequences sorting strings unicode.categories xml.syntax xml.writer xmode.catalog xmode.marker xmode.tokens ; IN: codebook ! Usage: "my/source/tree" utf8 "dest" codebook ! Writes tree.opf, tree.ncx, and tree.html to the "dest" directory ! Use kindlegen -unicode dest/tree.opf to compile tree.mobi file for Kindle CONSTANT: codebook-style { { COMMENT1 [ [XML <-> XML] ] } { COMMENT2 [ [XML <-> XML] ] } { COMMENT3 [ [XML <-> XML] ] } { COMMENT4 [ [XML <-> XML] ] } { DIGIT [ [XML <-> XML] ] } { FUNCTION [ [XML <-> XML] ] } { KEYWORD1 [ [XML <-> XML] ] } { KEYWORD2 [ [XML <-> XML] ] } { KEYWORD3 [ [XML <-> XML] ] } { KEYWORD4 [ [XML <-> XML] ] } { LABEL [ [XML <-> XML] ] } { LITERAL1 [ [XML <-> XML] ] } { LITERAL2 [ [XML <-> XML] ] } { LITERAL3 [ [XML <-> XML] ] } { LITERAL4 [ [XML <-> XML] ] } { MARKUP [ [XML <-> XML] ] } { OPERATOR [ [XML <-> XML] ] } [ drop ] } : first-line ( filename encoding -- line ) [ readln ] with-file-reader ; TUPLE: code-file name encoding mode ; : include-file-name? ( name -- ? ) { [ path-components [ "." head? ] any? not ] [ link-info type>> +regular-file+ = ] } 1&& ; : code-files ( dir -- files ) '[ [ include-file-name? ] filter [ dup detect-file dup binary? [ f ] [ 2dup dupd first-line find-mode ] if code-file boa ] map [ mode>> ] filter [ name>> ] sort-with ] with-directory-tree-files ; : html-name-char ( char -- str ) { { [ dup alpha? ] [ 1string ] } { [ dup digit? ] [ 1string ] } [ >hex 6 CHAR: 0 pad-head "_" "_" surround ] } cond ; : file-html-name ( name -- name ) [ html-name-char ] { } map-as concat ".html" append ; : toc-list ( files -- list ) [ name>> ] map natural-sort [ [ file-html-name ] keep [XML
  • ><->
  • XML] ] map ; ! insert zero-width non-joiner between all characters so words can wrap anywhere : zwnj ( string -- s|t|r|i|n|g ) [ CHAR: \u00200c "" 2sequence ] { } map-as concat ; ! We wrap every line in because Kindle tends to forget the font when ! moving back pages : htmlize-tokens ( tokens line# -- html-tokens ) swap [ [ str>> zwnj ] [ id>> ] bi codebook-style case ] map [XML <-> <-> XML] "\n" 2array ; : line#>string ( i line#len -- i-string ) [ number>string ] [ CHAR: \s pad-head ] bi* ; :: code>html ( dir file -- page ) file name>> :> name "Generating HTML for " write name write "..." print flush dir [ file [ name>> ] [ encoding>> ] bi file-lines ] with-directory :> lines lines length 1 + number>string length :> line#len file mode>> load-mode :> rules f lines [| l i | l rules tokenize-line i 1 + line#len line#>string htmlize-tokens ] map-index concat nip :> html-lines <-name->

    <-name->

    <-html-lines->
    XML> ; :: code>toc-html ( dir name files -- html ) "Generating HTML table of contents" print flush now timestamp>rfc822 :> timestamp dir absolute-path :> source dir [ files toc-list :> toc <-name->

    <-name->

    Generated from
    <-source->
    at <-timestamp->


      <-toc->
    XML> ] with-directory ; :: code>ncx ( dir name files -- xml ) "Generating NCX table of contents" print flush files [| file i | file name>> :> name name file-html-name :> filename i 2 + number>string :> istr [XML playOrder=<-istr->> <-name-> /> XML] ] map-index :> file-nav-points Table of Contents <-file-nav-points-> XML> ; :: code>opf ( dir name files -- xml ) "Generating OPF manifest" print flush name ".ncx" append :> ncx-name files [ name>> file-html-name dup [XML href=<-> media-type="text/html" /> XML] ] map :> html-manifest files [ name>> file-html-name [XML /> XML] ] map :> html-spine > <-name-> en <-html-manifest-> media-type="application/x-dtbncx+xml" /> <-html-spine-> XML> ; : write-dest-file ( xml dest-dir name ext -- ) append append-path utf8 [ write-xml ] with-file-writer ; :: codebook ( src-dir dest-dir -- ) "Generating ebook for " write src-dir write " in " write dest-dir print flush dest-dir make-directories src-dir file-name :> name src-dir code-files :> files src-dir name files code>opf dest-dir name ".opf" write-dest-file src-dir name files code>ncx dest-dir name ".ncx" write-dest-file src-dir name files code>toc-html dest-dir "_toc.html" "" write-dest-file files [| file | src-dir file code>html dest-dir file name>> file-html-name "" write-dest-file ] each "Job's finished" print flush ;