#!/usr/bin/perl -w
#
# gbtoxhtml.pl
#
#####
use strict;
delete @ENV{qw(PATH IFS CDPATH ENV BASH_ENV)}; # clean house for taint mode
my $PROGRAM_NAME = 'gbtoxhtml';
my $USAGE = "$PROGRAM_NAME [options] book-code\n\t--meta=[metadata file]\n\t--xml=[book XML]\n\t--xsl=[XSL transformation]\n\t--language=[language area of input data (output determined by meta file)]\n\t--verbose\n";
my $FILENAME_SEPARATOR = '/';
my $RXP = '/usr/bin/rxp';
my $CP = '/bin/cp';
my $MV = '/bin/mv';
my $TAR = '/bin/tar';
my $ZIP = '/usr/bin/zip';
my $BZIP2 = '/bin/bzip2';
my $JAVA = '/usr/bin/java';
my $XALAN_JAR = '/usr/share/java/xalan2.jar';
my $RM = '/bin/rm';
my $CHMOD = '/bin/chmod';
# Check that all the binaries are were want them
my @BINARIES;
push @BINARIES, ($RXP, $CP, $MV, $TAR, $ZIP, $BZIP2, $JAVA, $XALAN_JAR, $RM, $CHMOD);
foreach (@BINARIES) {
if ( ! -e $_ ) {
die "$PROGRAM_NAME: Cannot find binary '".$_."'. Please install it.\n";
}
}
###
my $bookCode = '';
my $metaFile = '';
my $bookXML = '';
my $xhtmlXSL = 'common/xsl/xhtml.xsl';
my $language = 'en';
my $verbose = 0;
while( $#ARGV > -1 ) {
my $cmdLineItem = shift @ARGV;
if( $cmdLineItem =~ /^--meta=(.+)$/ ) {
$metaFile = $1;
}
elsif( $cmdLineItem =~ /^--xml=(.+)$/ ) {
$bookXML = $1;
}
elsif( $cmdLineItem =~ /^--xsl=(.+)$/ ) {
$xhtmlXSL = $1;
}
elsif( $cmdLineItem =~ /^--language=(.+)$/ ) {
$language = $1;
}
elsif( $cmdLineItem =~ /^--verbose/ ) {
$verbose = 1;
}
else {
$bookCode = $cmdLineItem;
}
}
if( $bookCode eq '' ) { die "Unspecified book code\n$USAGE"; }
if( $metaFile eq '' ) { $metaFile = "$language/.publisher/rules/standard"; }
if( $bookXML eq '' ) { $bookXML = "$language/xml/$bookCode.xml"; }
if( $xhtmlXSL eq '' ) { die "Unspecified XSL transformation file\n$USAGE"; }
if( -e $metaFile && -f $metaFile && -r $metaFile ) {
open( META, '<', $metaFile ) or die qq{Unable to open metadata file ($metaFile): $!\n};
}
else { die qq{Improper metadata file ($metaFile)\n}; }
my $meta = '';
while( my $line = ) {
$meta .= $line if $line !~ /^[[:space:]]*#/;
}
close META;
my $rulesString = '';
if( $meta =~ /^[[:space:]]*$bookCode[[:space:]]*{([^}]*)}/sm ) {
$rulesString = $1;
}
else {
die "Book code ($bookCode) not found in metadata file or invalid file syntax\n";
}
my @rules = split( /[[:space:]\n]*;[[:space:]\n]*/, $rulesString );
my %rulesHash;
foreach my $rule (@rules) {
if( $rule =~ /[[:space:]]*([^:]+)[[:space:]]*:[[:space:]]*(.+)$/s ) {
$rulesHash{ $1 } = $2;
}
else {
die "Unrecognized rule syntax:\n$rule\n";
}
}
if( $bookXML =~ m{^([-\w\@./]+)$} ) {
$bookXML = $1;
unless( -e $bookXML && -f $bookXML && -r $bookXML ) {
die "XML does not exist or is not readable\n";
}
if( -e $RXP ) {
system( $RXP, '-Vs', $bookXML ) == 0
or die "XML validation failed\n";
}
else {
warn "XML Validator ($RXP) not installed - validate before publication\n";
}
unless( defined $rulesHash{'language'} ) { die "Metadata file leaves language unspecified\n"; }
unless( defined $rulesHash{'book-series'} ) { die "Metadata file leaves book series unspecified\n"; }
unless( defined $rulesHash{'images'} ) { die "Metadata file leaves image directories unspecified\n"; }
unless( defined $rulesHash{'csst'} ) { die "Metadata file leaves CSS templates unspecified\n"; }
my $outPath = $rulesHash{'language'} . $FILENAME_SEPARATOR . 'xhtml' . $FILENAME_SEPARATOR . $rulesHash{'book-series'} .$FILENAME_SEPARATOR . $bookCode;
unless( -e $outPath && -d $outPath ) {
my @dirs = split ( /$FILENAME_SEPARATOR/, $outPath );
my $dirPath = '';
for( my $i = 0; $i <= $#dirs; ++$i ) {
$dirPath .= $dirs[$i] . $FILENAME_SEPARATOR;
if( -e $dirPath && ! -d $dirPath ) { die "Output directory name exists and is not a directory\n"; }
unless( -e $dirPath ) {
mkdir $dirPath or die( "Unable to create output directory ($outPath): $!\n" );
}
}
}
unless( -e $outPath && -d $outPath ) {
die "Unknown error creating output directory\n";
}
my $bookPath = "$outPath${FILENAME_SEPARATOR}";
print qx{$RM ${bookPath}*} if -e $bookPath."/toc.htm";
print qx{$JAVA -classpath "$XALAN_JAR" org.apache.xalan.xslt.Process -IN "$bookXML" -XSL "$xhtmlXSL" -OUT "${bookPath}foo.xml" -PARAM background-color "$rulesHash{'background-color'}" -PARAM text-color "$rulesHash{'text-color'}" -PARAM link-color "$rulesHash{'link-color'}" -PARAM use-illustrators "$rulesHash{'use-illustrators'}" -PARAM language "$rulesHash{'language'}"};
print qx{$RM ${bookPath}foo.xml};
foreach my $cssTemplate (split( /:/, $rulesHash{'csst'} )) {
$cssTemplate =~ m/([^${FILENAME_SEPARATOR}]+)t$/;
my $templateFilename = $1;
open( TEMPLATE, '<', $cssTemplate ) or die "Unable to open CSS template file ($cssTemplate): $!\n";
open( STYLESHEET, '>', "$bookPath${templateFilename}" ) or die "Unable to open stylesheet file ($bookPath${templateFilename}) for writing: $!\n";
while( my $templateLine = ) {
while( $templateLine =~ /%%([^%[:space:]]+)%%/ ) {
my $name = $1;
$templateLine =~ s/%%${name}%%/$rulesHash{$name}/g;
}
print STYLESHEET $templateLine;
}
}
close TEMPLATE;
close STYLESHEET;
foreach my $imagePath (split( /:/, $rulesHash{'images'} )) {
unless( -e $imagePath && -d $imagePath ) {
die "Image path ($imagePath) does not exist or is not a directory\n";
}
print qx{$CP $imagePath${FILENAME_SEPARATOR}* $bookPath};
}
#print qx{$TAR cf ${bookCode}.tar ${bookPath}*};
print qx{$ZIP -8 -q ${bookCode}.zip ${bookPath}*};
#print qx{$BZIP2 -9 ${bookCode}.tar};
print qx{$MV ${bookCode}* $bookPath};
}
print "Success\n" if $verbose;