X-Git-Url: http://git.projectaon.org/?a=blobdiff_plain;f=common%2Fscripts%2Fxmlize.pl;h=d78bd94ce7b3e93a59abb9b11b4237373596d854;hb=cff1c4dd5ab679f83b05e4ac86af1e6ea3d8ec1d;hp=5ca73a9285e74a6df037c54a624fab202be2acac;hpb=5b3469ce11c15d79211f803879e03563ec7a0099;p=project-aon.git diff --git a/common/scripts/xmlize.pl b/common/scripts/xmlize.pl index 5ca73a9..d78bd94 100755 --- a/common/scripts/xmlize.pl +++ b/common/scripts/xmlize.pl @@ -8,8 +8,10 @@ use strict; use warnings; use utf8; use open ':encoding(UTF-8)'; +use open ':std', ':encoding(UTF-8)'; my $FILE_EXTENSION = 'txt'; +my $BASE_INDENT = ' '; #### Main Routine @@ -30,7 +32,7 @@ print << "(End of XML Header)"; %general.inclusions; ]> - + [Insert Title] @@ -98,9 +100,9 @@ for( my $sectionNumber = $minSectionNumber; $sectionNumber <= $numberOfSections; } } - print "\n\n
\n $sectionNumber\n\n \n"; + print "\n\n$BASE_INDENT
\n$BASE_INDENT $sectionNumber\n\n$BASE_INDENT \n"; print @newlines; - print " \n
"; + print "$BASE_INDENT
\n$BASE_INDENT
"; } print << "(End of XML footer)"; @@ -120,6 +122,10 @@ print << "(End of XML footer)"; sub xmlize { my( $inline, $infile ) = @_; + if(!defined $inline || $inline eq "") { + return ""; + } + $inline =~ tr/\t/ /; $inline =~ s/[[:space:]]{2,}/ /g; $inline =~ s/[[:space:]]+$//; @@ -129,6 +135,7 @@ sub xmlize { $inline =~ s/\&(?=[[:space:]])//g; $inline =~ tr/\"\`/\'/; $inline =~ s/[\N{U+2018}\N{U+201C}]//g; + $inline =~ s|[\N{U+2019}\N{U+201D}]([[:alpha:]])|$1|g; $inline =~ s/[\N{U+2019}\N{U+201D}]/<\/quote>/g; $inline =~ s/[\N{U+2014}]//g; $inline =~ s/[\N{U+2014}]//g; @@ -138,15 +145,15 @@ sub xmlize { if( $inline =~ /^\*/ ) { # unordered lists - $inline =~ s/^\*\s*/
    \n
  • /; - $inline =~ s/\s*\*\s*/<\/li>\n
  • /g; - $inline .= "
  • \n
"; + $inline =~ s/^\*\s*/$BASE_INDENT
    \n$BASE_INDENT
  • /; + $inline =~ s/\s*\*\s*/<\/li>\n$BASE_INDENT
  • /g; + $inline .= "
  • \n$BASE_INDENT
"; } elsif( $inline =~ /^\d+\)\s/ ) { # ordered lists - $inline =~ s/^\d+\)\s+/
    \n
  1. /; - $inline =~ s/\s*\d+\)\s+/<\/li>\n
  2. /g; - $inline .= "
  3. \n
"; + $inline =~ s/^\d+\)\s+/$BASE_INDENT
    \n$BASE_INDENT
  1. /; + $inline =~ s/\s*\d+\)\s+/<\/li>\n$BASE_INDENT
  2. /g; + $inline .= "
  3. \n$BASE_INDENT
"; } elsif( $inline =~ /^\<\!\-\-\spre\s\-\-\>/ ) { # pre-formatted text @@ -155,21 +162,21 @@ sub xmlize { } elsif( $inline =~ /^.+:\s+CLOSE\sCOMBAT\sSKILL/ ) { # Freeway Warrior combat - $inline =~ s/^(.+):\s+CLOSE\sCOMBAT\sSKILL\s+([0-9]+)\s+ENDURANCE\s+([0-9]+)/ $1<\/enemy>$2<\/enemy-attribute>$3<\/enemy-attribute><\/combat>/g; + $inline =~ s/^(.+):\s+CLOSE\sCOMBAT\sSKILL\s+([0-9]+)\s+ENDURANCE\s+([0-9]+)/$BASE_INDENT $1<\/enemy>$2<\/enemy-attribute>$3<\/enemy-attribute><\/combat>/g; } elsif( $inline =~ /^.+:\s+COMBAT\sSKILL/ ) { # combat - $inline =~ s/^(.+):\s+COMBAT\sSKILL\s+([0-9]+)\s+ENDURANCE\s+([0-9]+)/ $1<\/enemy>$2<\/enemy-attribute>$3<\/enemy-attribute><\/combat>/; + $inline =~ s/^(.+):\s+COMBAT\sSKILL\s+([0-9]+)\s+ENDURANCE\s+([0-9]+)/$BASE_INDENT $1<\/enemy>$2<\/enemy-attribute>$3<\/enemy-attribute><\/combat>/; } elsif( $inline =~ /^(.*)\b(return|turn|go)([a-zA-Z\s]+?to )(\d{1,3})/i ) { # links - $inline =~ s/^(.*)\b(return|turn|go)([a-zA-Z\s]+?to )(\d{1,3})(.*)/ $1$2$3$4<\/link-text>$5<\/choice>/i; + $inline =~ s/^(.*)\b(return|turn|go)([a-zA-Z\s]+?to )(\d{1,3})(.*)/$BASE_INDENT $1$2$3$4<\/link-text>$5<\/choice>/i; $inline =~ s/\s+<\/choice>/<\/choice>/; } elsif( $inline =~ /^\[/ ) { # signposts $inline =~ s/\[(.*)\]/$1/; - $inline = " $inline"; + $inline = "$BASE_INDENT $inline"; $inline =~ s/\s+<\/signpost>/<\/signpost>/; } elsif( $inline =~ /^/ ) { @@ -180,7 +187,7 @@ sub xmlize { # do nothing } else { - $inline = "

$inline

"; + $inline = "$BASE_INDENT

$inline

"; } # Interferes with selecting a combat paragraph if done earlier