#!/usr/bin/env bash
#
# cleanxml.sh - tidy quoted-attribute formatting in every *.html file found
# under the current directory, rewriting each file in place.
#
# Usage: cleanxml.sh
#   Positional arguments are accepted and ignored.
#
# Each file is run through four sequential passes:
#   1. a line ending in `"`  is joined to the following line with one space;
#   2. a line ending in `" ` is joined the same way;
#   3. a line ending in a character matching [a-z] is joined the same way;
#   4. every run of spaces directly after a `"` is squeezed to one space.
#
# The path of each file is printed to stdout before it is processed.

# Let a failure in any sed stage fail the whole pipeline, so a broken run is
# never mistaken for a good one and moved over the original file.
set -o pipefail

#######################################
# Filter that applies the four cleaning passes.
# Inputs:  HTML text on stdin
# Outputs: cleaned text on stdout
# Returns: non-zero if any sed stage fails
#######################################
clean_stream() {
  # The three joins stay separate processes on purpose: each pass sees the
  # complete output of the previous one, which is not the same as testing all
  # three line endings in a single loop.
  # `:a` and the loop body are separate -e scripts so the label ends cleanly.
  sed -e :a -e '/"$/N;s/\n/ /;ta' \
    | sed -e :a -e '/" $/N;s/\n/ /;ta' \
    | sed -e :a -e '/[a-z]$/N;s/\n/ /;ta' \
    | sed -e 's/"  */" /g'   # quote + one-or-more spaces -> quote + one space
}

#######################################
# Clean a single file in place.
# Arguments: $1 - path of the file to rewrite
# Outputs:   an error message on stderr if the file could not be cleaned
# Returns:   0 on success, 1 on failure (the original file is left untouched)
#######################################
clean_file() {
  local file=$1
  local tmp="${file}.tmp"

  # Stage the result beside the original and only replace the original when
  # the whole pipeline succeeded.
  if clean_stream <"$file" >"$tmp" && mv -- "$tmp" "$file"; then
    return 0
  fi

  rm -f -- "$tmp"
  printf 'cleanxml: failed to clean %s\n' "$file" >&2
  return 1
}

#######################################
# Clean every regular *.html file below the current directory.
# Outputs: each file path on stdout, one per line
# Returns: 0 if every file was cleaned, 1 if any file failed
#######################################
main() {
  local file
  local status=0

  # NUL-delimited paths survive spaces, tabs and newlines in file names.
  while IFS= read -r -d '' file; do
    printf '%s\n' "$file"
    clean_file "$file" || status=1
  done < <(find . -type f -name '*.html' -print0)

  return "$status"
}

main "$@"