#!/bin/sh # # Copyright (C) 2001-2007 Graeme Walker # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program. If not, see . # === # # mu2docbook.sh # # Mark-up to docbook converter. Converts the output of "txt2mu.sh" # into docbook markup. # # Does some in-line formatting independently of the line-based # mark-up in the input. For example, it converts quoted words into # "" tags, and it converts "*foo* [bar]" text into # hypertext links. # # The "-x" flag suppresses the output of the xml header. This is # useful when the output is to be spliced into another document. # # usage: mu2docbook.sh [-a ] [{-x|--head|--tail}] [] # # (If the title is not supplied then the input is copied # to a temporary file in order to extract the H1 header # text for the title.) # awk="gawk" if test "${1}" = "-a" then shift if test "${1}" != "" ; then awk="${1}" ; fi shift fi full="1" if test "${1}" = "-x" then full="0" shift fi op="" if test "${1}" = "--head" then shift op="head" elif test "${1}" = "--tail" then shift op="tail" fi title="${1}" Head() { echo '' | ${awk} -v prefix="`basename $0`" -v title="${1}" -v full="${2}" ' BEGIN { if( full ) { dtd_name="-//OASIS//DTD DocBook XML V4.1.2//EN" dtd_ref="http://www.oasis-open.org/docbook/xml/4.1.2/docbookx.dtd" qq="\"" printf( "%s\n" , "<?xml version=\"1.0\"?>" ) printf( "<!DOCTYPE article PUBLIC \"%s\" \"%s\">\n" , dtd_name , dtd_ref ) printf( "<article>\n" ) printf( " <articleinfo>\n" ) ; printf( " <title>%s\n" , title ) printf( " \n" ) } } ' } Tail() { echo '' | ${awk} -v prefix="`basename $0`" -v title="${1}" -v full="${2}" ' BEGIN { if( full ) { printf( "\n" ) } } ' } Body() { ${awk} -v prefix="`basename $0`" -v title="${1}" -v full="${2}" ' function arg1( type ) { sub( "[^,]*," , "" , type ) sub( ",.*" , "" , type ) return type } function arg2( type ) { sub( "[^,]*," , "" , type ) sub( "[^,]*," , "" , type ) sub( ",.*" , "" , type ) return type } function escape( line ) { gsub( "&" , "\\&" , line ) gsub( "<" , "\\<" , line ) gsub( ">" , "\\>" , line ) return line } function dequote( line ) { quote = "\"" not_quote = "[^" quote "]" start_tag="" end_tag="" gsub( quote not_quote "*" quote , start_tag "&" end_tag , line ) gsub( start_tag quote , start_tag , line ) gsub( quote end_tag , end_tag , line ) return line } function fn( line ) { gsub( "[^[:space:]][^[:space:]]*\\(\\)" , "&" , line ) return line } { pos = index( $0 , ":" ) type = substr( $0 , 1 , pos ) tail = substr( $0 , pos+1 ) etail_raw = escape(tail) etail = fn(dequote(escape(tail))) # h1 if( match(type,"^h1[:,]") ) { if( done_h2 ) printf( " \n" ) if( done_h1 ) printf( " \n" ) printf( "
%s\n" , etail ) done_h1 = 1 done_h2 = 0 } # h2 else if( match(type,"^h2[:,]") ) { if( done_h2 ) printf( "
\n" , etail ) printf( "
%s\n" , etail ) done_h2 = 1 } # item else if( match(type,"^item,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^item-end[:,]") ) printf( " \n" , etail ) # item-numbered else if( match(type,"^item-numbered,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-numbered[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^item-numbered-end[:,]") ) printf( " \n" , etail ) # item-outer else if( match(type,"^item-outer,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-outer[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-outer-end[:,]") ) printf( " \n \n" , etail ) # item-inner else if( match(type,"^item-inner,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-inner[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^item-inner-end[:,]") ) printf( " \n" , etail ) # item-name else if( match(type,"^item-name,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-name[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-name-end[:,]") ) printf( " \n \n" , etail ) # item-detail else if( match(type,"^item-detail,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^item-detail[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^item-detail-end[:,]") ) printf( " \n" ) else if( match(type,"^item-detail-blank[:,]") ) printf( " \n" ) # code else if( match(type,"^code,1[:,]") ) printf( " %s" , etail_raw ) else if( match(type,"^code[:,]") ) printf( "\n%s" , etail_raw ) else if( match(type,"^code-end[:,]") ) printf( "\n" ) # text else if( match(type,"^text,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^text[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^text-end[:,]") ) printf( " \n" ) # footer-text else if( match(type,"^footer,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^footer[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^footer-end[:,]") ) printf( " \n" ) # citation-text else if( match(type,"^citation,1[:,]") ) printf( "

\n %s\n" , etail ) else if( match(type,"^citation[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^citation-end[:,]") ) printf( "

\n" ) # author-text else if( match(type,"^author,1[:,]") ) printf( " \n %s\n" , etail ) else if( match(type,"^author[:,]") ) printf( " %s\n" , etail ) else if( match(type,"^author-end[:,]") ) printf( " \n" ) # html else if( match(type,"^html[:,]") ) printf( "%s\n" , tail ) # image else if( match(type,"^image[:,]") ) printf( "\n" , tail ) # blank else if( match(type,"^blank[:,]") ) printf( "\n" ) # ignore else if( match(type,"^ignore") ) printf( "" ) else if( match(type,"[^[:space:]]") ) printf( "%s: unrecognised mark-up tag on line %d: \"%s\"\n" , prefix , NR , type )>"/dev/fd/2" } END { if( done_h2 ) printf( "
\n" ) if( done_h1 ) printf( " \n" ) } ' Tail } Main() { Head "${title}" "${full}" Body "${title}" "${full}" Tail "${title}" "${full}" } Anchorise() { sed 's/\*\([^\*]*\)\* \[\([^]]*\)\]/\1<\/ulink>/g' } if test "${op}" = "head" then Head "${title}" "${full}" elif test "${op}" = "tail" then Tail "${title}" "${full}" elif test "${title}" = "" then tmp="`basename $0`.tmp" ${awk} '{print}' > ${tmp} title="`${awk} '/^h1/ { sub(\"[^:]*:\",\"\") ; print ; exit }' ${tmp}`" ${awk} '{print}' ${tmp} | Main "${title}" "${full}" | Anchorise rm -f ${tmp} else Main "${title}" "${full}" | Anchorise fi