#!/usr/bin/perl

use strict;
use XML::DOM;


my @inline_elsments=('a', 'book-name', 'book-title', 'city', 'code', 'custom-info', 'date',   
'email', 'emphasis', 'first-name', 'genre', 'home-page', 'id', 'isbn', 'image', 'keywords', 'lang', 'last-name', 
'middle-name', 'nickname', 'p', 'part', 'program-used', 'publish-info', 'publisher', 'sequence', 'src-lang', 'src-ocr', 
'src-url', 'strikethrough', 'strong', 'sub', 'subtitle', 'sup', 'text-author', 'title', 'translator', 'v', 'version', 
'year');
my %inline_elements_hash=();

foreach (@inline_elsments)
{
  $inline_elements_hash{$_}=1;
}

my $FileName= $ARGV[0];  
my $parser = new XML::DOM::Parser;  
my $root = $parser->parsefile($FileName)->getDocumentElement();

normalize_branch($root);
print $root->toString();

sub normalize_branch
{
  my $branch = shift;
  my $level = shift;
  foreach ($branch->getChildNodes())
  {
    normalize_text_node($_) if ($_->getNodeType()==TEXT_NODE);
  }
  my @children=$branch->getChildNodes();
  
  if (! $inline_elements_hash{$branch->getNodeName()} )
  {
    foreach my $node (@children)
    {
      my $new_node=$branch->getOwnerDocument()->createTextNode("\n  ".$level);
      $branch->insertBefore ($new_node,$node);
    }
    my $new_node=$branch->getOwnerDocument()->createTextNode("\n".$level);
    $branch->insertBefore ($new_node);
  }
  
  foreach (@children)
  {
    normalize_branch($_,$level."  ") if ($_->getNodeType()== ELEMENT_NODE);
  }
}
  
sub normalize_text_node
{
  my $text_node=shift;
  return 0 if ( $text_node->getNodeType()!=TEXT_NODE );
  my $text=$text_node->getData();
  $text=~s/\s+/ /g;
  $text=~s/^ //g;
  $text=~s/ $//g;
  if ($text eq '')
  {
    $text_node->getParentNode()->removeChild($text_node);
  } else
  {
    $text_node->setData($text);
  }
}
  

