1 files changed, 9 insertions, 3 deletions
diff --git a/lib/sisu/v0/shared_xml.rb b/lib/sisu/v0/shared_xml.rb
index 228a5c14..7ecc52bb 100644
--- a/lib/sisu/v0/shared_xml.rb
+++ b/lib/sisu/v0/shared_xml.rb
@@ -254,6 +254,8 @@ module SiSU_XML_munge
           para.gsub!(/ÿ/u, '&#255;') # '&yuml;'   # &#255;
           para.gsub!(/‘/u, '&#8216;') # '&lsquo;' # &#8216;
           para.gsub!(/’/u, '&#8217;') # '&rsquo;' # &#8217;
+          para.gsub!(/“/u, '&#8220;') # &ldquo;   # &#8220;
+          para.gsub!(/”/u, '&#8221;') # &rdquo;   # &#8221;
           para.gsub!(/–/u, '&#8211;') # &ndash;   # &#8211;
           para.gsub!(/—/u, '&#8212;') # &mdash;   # &#8212;
           para.gsub!(/∝/u, '&#8733;') # &prop;    # &#8733;
@@ -355,6 +357,8 @@ module SiSU_XML_munge
           para.gsub!(/ÿ/u, '&yuml;')      # &#255;
           para.gsub!(/‘/u, '&#lsquo;')    # &lsquo;  # &#8216;
           para.gsub!(/’/u, '&#rsquo;')    # &rsquo;  # &#8217;
+          para.gsub!(/“/u, '&ldquo;')     # &ldquo;   # &#8220;
+          para.gsub!(/”/u, '&rdquo;')     # &rdquo;   # &#8221;
           para.gsub!(/–/u, '&ndash;')     # &ndash;  # &#8211;
           para.gsub!(/—/u, '&mdash;')     # &mdash;  # &#8212;
           para.gsub!(/∝/u, '&prop;')      # &prop;   # &#8733;
@@ -369,11 +373,13 @@ module SiSU_XML_munge
     end
     def tidywords(wordlist)
       wordlist.each do |x|
+        # imperfect heuristic, will not catch all cases: a stray "&" sharing a word with an "&...;" run (e.g. "a&b&#160;") is left unescaped
         x.gsub!(/&/,'&amp;') unless x =~/&\S+;/
+        x.gsub!(/&([A-Z])/,'&amp;\1') # escapes "&" before A-Z even when the word held an "&...;" run (e.g. "AT&T;"); NOTE(review): also rewrites "&Aacute;"-style entities -- confirm none reach here
       end
     end
     def markup(para='')
-      wordlist=para.scan(/\S+|\n/) #\n needed for tables, check though added 2005w17
+      wordlist=para.scan(/&[#0-9a-z]+;|\S+|\n/) #\n needed for tables, check though added 2005w17
       para=tidywords(wordlist).join(' ').strip
       para.gsub!(/#{Mx[:br_line]}|#{Mx[:br_nl]}/,'<br />')
       para.gsub!(/#{Mx[:mk_o]}:name#\S+?#{Mx[:mk_c]}/,'')
@@ -439,7 +445,7 @@ module SiSU_XML_munge
         "<image.path>#{@dir.url.images_local}\/\\1</image.path>")
       para.gsub!(/&nbsp;/,'&#160;')
       #para.gsub!(/&nbsp;/,' ') #clean
-      wordlist=para.scan(/\S+|\n/) #\n needed for tables, check though added 2005w17
+      wordlist=para.scan(/&[#0-9a-z]+;|\S+|\n/) #\n needed for tables, check though added 2005w17
       para=tidywords(wordlist).join(' ').strip
       para
     end
@@ -462,7 +468,7 @@ module SiSU_XML_munge
         "<image.path>#{@dir.url.images_local}\/\\1</image.path>")
       para.gsub!(/&nbsp;/,'&#160;')
       #para.gsub!(/&nbsp;/,' ') #clean
-      wordlist=para.scan(/\S+|\n/) #\n needed for tables, check though added 2005w17
+      wordlist=para.scan(/&[#0-9a-z]+;|\S+|\n/) #\n needed for tables, check though added 2005w17
       para=tidywords(wordlist).join(' ').strip
       para
     end