aboutsummaryrefslogtreecommitdiffhomepage
path: root/data/sisu/v4/conf/convert
diff options
context:
space:
mode:
Diffstat (limited to 'data/sisu/v4/conf/convert')
-rw-r--r--data/sisu/v4/conf/convert/kdissert_to_sisu161
-rw-r--r--data/sisu/v4/conf/convert/modify.rb376
-rw-r--r--data/sisu/v4/conf/convert/sisu_convert519
-rw-r--r--data/sisu/v4/conf/convert/wvHtml.xml388
-rw-r--r--data/sisu/v4/conf/convert/wvSiSU.xml360
5 files changed, 0 insertions, 1804 deletions
diff --git a/data/sisu/v4/conf/convert/kdissert_to_sisu b/data/sisu/v4/conf/convert/kdissert_to_sisu
deleted file mode 100644
index 35921c3e..00000000
--- a/data/sisu/v4/conf/convert/kdissert_to_sisu
+++ /dev/null
@@ -1,161 +0,0 @@
-#!/usr/bin/env ruby
-=begin
- * Name: modify.rb
- * Author: Ralph Amissah
- * http://www.jus.uio.no/sisu
- * http://www.jus.uio.no/sisu/SiSU/download
- * Description: Conversion script from kdissert .kdi to sisu markup .sst
- * Copyright (C) 2004, 2006 Ralph Amissah
- * Packaged with: SiSU information Structuring Universe -
- Structured information, Serialized Units
- * SiSU Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006 Ralph Amissah
-
- * License: GPL 3 or later
-
- Summary of GPL 3
-
- This program is free software; you can redistribute it and/or modify it
- under the terms of the GNU General Public License as published by the Free
- Software Foundation; either version 3 of the License, or (at your option)
- any later version.
-
- This program is distributed in the hope that it will be useful, but WITHOUT
- ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
- more details.
-
- You should have received a copy of the GNU General Public License along
- with this program; if not, write to the Free Software Foundation, Inc.,
- 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
-
- If you have Internet connection, the latest version of the GPL should be
- available at these locations:
- http://www.fsf.org/licenses/gpl.html
- http://www.gnu.org/copyleft/gpl.html
- http://www.jus.uio.no/sisu/gpl3.fsf
-
- © Ralph Amissah 1997, current 2006.
- All Rights Reserved.
-
- * Ralph Amissah: ralph@amissah.com
- ralph.amissah@gmail.com
-=end
-require 'rexml/document'
-include REXML
-argv=$*
-@sisu,@sisu_base=Array.new,Array.new
-unless argv.empty?
- argv.each do |kdi|
- if kdi =~/\.kdi$/
- system("cp #{kdi} #{kdi}.tar.gz && tar xzvf #{kdi}.tar.gz && rm #{kdi}.tar.gz")
- file=File.new("maindoc.xml")
- #system("cp #{kdi} /tmp/. && cd /tmp && tar xzvf /tmp/#{kdi} && cd -")
- #file=File.new("/tmp/maindoc.xml")
- @output=File.new("#{kdi}.sst",'w')
- doc=Document.new(file)
- root=doc.root
- @el=Array.new
- root.each do |x|
- end
- root.each_with_index do |content,idx|
- if root.elements["item[#{idx}]/summary"]
- id,ma,ch=nil,nil,Array.new
- if root.elements["item[#{idx}]/id"]
- id=root.elements["item[#{idx}]/id"].text.to_i
- end
- if root.elements["item[#{idx}]/parent"]
- ma=root.elements["item[#{idx}]/parent"].text.to_s
- end
- if root.elements["item[#{idx}]/child"] #problem only get one child, even where several
- root.get_elements("item[#{idx}]/child").each do |x|
- ch << x.text
- end
- end
- if root.elements["item[#{idx}]/summary"]
- sum=root.elements["item[#{idx}]/summary"].text.to_s.strip
- end
- if root.elements["item[#{idx}]/text"]
- txt=root.elements["item[#{idx}]/text"].text.to_s.strip
- end
- @el[id]=Hash.new
- @el[id][:id]=id
- @el[id][:ma]=ma
- @el[id][:ch]=ch
- @el[id][:sum]=sum
- @el[id][:txt]=txt
- if ma == '-1'
- @el[id][:lev]=':A'
- @top=id
- end
- end
- end
- @doc=Array.new
- @title=@el[@top][:sum]
- p @el[@top][:sum]
- @doc << ':A~ ' + @el[@top][:sum]
- @el[@top][:ch].each do |x|
- @el[x.to_i][:lev]='1'
- @doc << '1~ ' + @el[x.to_i][:sum]
- @doc << @el[x.to_i][:txt]
- @el[x.to_i][:ch].each do |y|
- @el[y.to_i][:lev]='2'
- @doc << '2~ ' + @el[y.to_i][:sum]
- @doc << @el[y.to_i][:txt]
- @el[y.to_i][:ch].each do |z|
- @el[z.to_i][:lev]='3'
- @doc << '3~ ' + @el[z.to_i][:sum]
- @doc << @el[z.to_i][:txt]
- @el[z.to_i][:ch].each do |za| #unsupported... consder
- @el[za.to_i][:lev]='4'
- @doc << '!_ ' + @el[za.to_i][:sum]
- @doc << @el[za.to_i][:txt]
- end
- end
- end
- end
- #@el.each_with_index do |x,i|
- # if x: puts "#{i}: lev: #{x[:lev]}, id: #{x[:id]}, ma: #{x[:ma]}, ch: #{x[:ch].join(',')}"
- # end
- #end
-# regexs strip most kdissert markup, and provide minimal info for sisu markup -->
- @doc.each do |c,idx|
- c.gsub!(/<\/summary>/,'')
- c.gsub!(/<html>.+?\n|<\/body>|<\/html>|<p>/m,'')
- c.gsub!(/<\/p>/,"\n")
- c.gsub!(/<span style="font-weight:600">(.+?)<\/span>/," *{ \\1 }* ")
- c.gsub!(/<span style="text-decoration:underline">(.+?)<\/span>/," _{ \\1 }_ ")
- c.gsub!(/<span style="font-style:italic">(.+?)<\/span>/," /{ \\1 }/ ")
- c.gsub!(/<ul type="disc">/,'_* ')
- c.gsub!(/<\S+?>/,'')
- c.gsub!(/&lt;(:p[bn])&gt;/,"<\\1>")
- c.gsub!(/&lt;&lt;(|.?|@|.?|)/,"<<\\1")
- c.gsub!(/&quot;/,'"')
- c.gsub!(/ \s+/,' ')
- @sisu_base << c.strip + "\n\n"
- end
- else puts ".kdi extension expected, filename not recognised: << #{kdi} >>"
- end
- end
-else puts '.kdi file for conversion to sisu expected'
-end
-sisu_head=<<WOK
-% converted from Kdissert to SiSU
-
-@title: #@title
-
-@prefix: Kdissert mind/topic mapping auto conversion to SiSU markup
-
-@links: {Kdissert}http://freehackers.org/~tnagy/kdissert/
-
-@base_program: kdissert
-
-% @date:
-
-@rcs: $Id$
-
-@level: num_top=1
-
-WOK
-#puts @sisu_base
-@output << sisu_head << @sisu_base
-__END__
diff --git a/data/sisu/v4/conf/convert/modify.rb b/data/sisu/v4/conf/convert/modify.rb
deleted file mode 100644
index 8a4b9074..00000000
--- a/data/sisu/v4/conf/convert/modify.rb
+++ /dev/null
@@ -1,376 +0,0 @@
-#!/usr/bin/env ruby
-# encoding: utf-8
-=begin
-
- * Name: modify.rb
-
- * Description: A conversion script for canned substitutions,
- a fairly generic simple tool that can be used to store other canned conversions,
- (used here for altering SiSU markup or the SiSU program)
-
- * Author: Ralph Amissah
-
- * Copyright: (C) 1997 - 2012, Ralph Amissah, All Rights Reserved.
-
- * License: GPL 3 or later:
-
- * Packaged with: SiSU a framework for document structuring, publishing & search
-
- Copyright (C) Ralph Amissah
-
- This program is free software: you can redistribute it and/or modify it
- under the terms of the GNU General Public License as published by the Free
- Software Foundation, either version 3 of the License, or (at your option)
- any later version.
-
- This program is distributed in the hope that it will be useful, but WITHOUT
- ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
- more details.
-
- You should have received a copy of the GNU General Public License along with
- this program. If not, see <http://www.gnu.org/licenses/>.
-
- If you have Internet connection, the latest version of the GPL should be
- available at these locations:
- <http://www.fsf.org/licensing/licenses/gpl.html>
- <http://www.gnu.org/licenses/gpl.html>
-
- <http://www.jus.uio.no/sisu/gpl.fsf/toc.html>
- <http://www.jus.uio.no/sisu/gpl.fsf/doc.html>
- <http://www.jus.uio.no/sisu/gpl.fsf/plain.txt>
-
- * Hompages:
- <http://www.jus.uio.no/sisu>
- <http://www.sisudoc.org>
-
- * Download:
- <http://www.jus.uio.no/sisu/SiSU/download.html>
-
- * Ralph Amissah
- <ralph@amissah.com>
- <ralph.amissah@gmail.com>
-
-=end
-module SiSU_Modify
- class Operations
- def initialize(cf,files)
- @cf,@files=cf,files
- @description="This is a script that contains canned text conversions for reuse"
- pwd=Dir.pwd
- @mod_inst='modify_instructions.rb'
- @modify_instructions_script="#{pwd}/#{@mod_inst}"
- if FileTest.file?(@modify_instructions_script) ==true
- puts <<-WOK
- autoload script: "#{@modify_instructions_script}"
- used by "ruby #{__FILE__} --convert" if
- "Extracted.new.modify.modules_and_classes" is used
- (see "matches_and_replaces")
- EDIT this file manually
- [to rebuild run: "ruby #{__FILE__} --build-gsub"]
-
- WOK
- else
- puts <<-WOK
- autoload script does not exist: "#{@modify_instructions_script}"
- needed for "ruby #{__FILE__} --convert" if
- "Extracted.new.modify.modules_and_classes" is used
- (see "matches_and_replaces")
- try run: "ruby #{__FILE__} --build-gsub"
-
- WOK
- end
- autoload :Extracted, "./#{@mod_inst}"
- end
- def matches_and_replaces #edit manually
- [
- #Extracted.new.modify.modules_and_classes,
- #Extracted.new.modify.modules,
- #Extracted.new.modify.classes,
- #modify.dates,
- #modify.modules,
- #modify.classes,
- #modify.misc,
- ]
- end
- def message(text)
- response=''
- while response !~/yes/
- print %{
- #{text}
- To continue type "yes" [to exit type "no" or "quit"]: }
- response=File.new('/dev/tty').gets.strip
- exit if response =~/^(?:quit|no)$/
- end
- end
- def help
- print <<WOK
-
-#{@description}
-
-note converting twice in a single direction will result
-in markup inconsistency
-
-modify.rb --convert
- performs the current conversion that is set in method "matches_and_replaces",
- this needs to be edited manually, as do the substitutions to be made on the
- files matched in the settings [handle with care]
-
-modify.rb --report
- reports on the names of modules and classes in each file requested
- (the defalt is all)
-
-modify.rb --build-gsub
- creates modify_instructions.rb methods for substitutions of methods and
- classes for editing
-
-WOK
- exit
- end
- #%% substitutions to be made
- # [//, ''],
- #def rename_default
- # message(%q{rename SiSU modules, classes, date})
- # [
- # [/1997\s+-\s+2012/, '1997 - 2012'],
- # ]
- #end
- def modify
- def misc
- [
- #[//, ''],
- ]
- end
- def dates
- [
- [/1997\s+-\s+2011/, '1997 - 2012'],
- ]
- end
- def modules
- [
- #[//, ''],
- ]
- end
- def classes
- [
- #[//, ''],
- ]
- end
- self
- end
- def convert
- message("WARNING, proceed at your own risk,\npermanent changes requested for the above named files\n best that you check (manually) what this file is set to do\n conversions set are at the top of the file")
- if matches_and_replaces.length > 0
- @files.each do |i|
- @new,@matched,@empty1,@empty2=true,false,false,false
- file=File.open(i,'r')
- cont=file.readlines
- file.close
- @file=File.new(i,'w')
- cont.each do |t|
- matches_and_replaces.each do |match_and_replace|
- match_and_replace.each do |m,r|
- if t =~m
- p m.to_s + ' -> ' + r
- puts "in: #{t}"
- t=t.gsub(m,r) if m and r
- puts "out: #{t}"
- end
- end
- end
- if t=~/^\s*$/; @empty1=true
- else @empty1=false
- end
- @file.puts t unless (@empty1==true and @empty2==true)
- if t=~/^\s*$/; @empty2=true
- else @empty2=false
- end
- end
- @file.close
- end
- end
- end
- def report_modules_and_classes
- @f=nil
- @structure={}
- @arr={mod: [], cl: []}
- @files.each do |f|
- @new,@matched,@empty1,@empty2=true,false,false,false
- file=File.open(f,'r')
- cont=file.readlines
- file.close
- cont.each do |t|
- if f != @f
- @f=f
- @mod=nil
- #puts "---\n#{@f}"
- @structure[@f]={}
- end
- if t =~/^\s*module\s+\S+/
- @mod=t.match(/^\s*module\s+(\S+)/)[1]
- #puts ' ' + @mod
- @arr[:mod] << @mod
- @structure[@f].store(@mod,[])
- #@structure[@f] = {@mod => []}
- end
- if t =~/^\s*class\s+\S+/
- cl=t.match(/^\s*class\s+(\S+)/)[1]
- #puts ' ' + cl
- @arr[:cl] << cl
- @structure[@f][@mod] << cl
- end
- end
- end
- @structure.sort.each do |fl,modules|
- puts "---\n" + fl
- modules.sort.each do |mod,classes|
- puts ' ' + mod
- classes.sort.each do |cl|
- puts ' ' + cl
- end
- end
- end
- puts '---'
- puts 'number of modules: ' + @arr[:mod].length.to_s + ', unique: ' + @arr[:mod].uniq.length.to_s
- puts 'number of classes: ' + @arr[:cl].length.to_s + ', unique: ' + @arr[:cl].uniq.length.to_s
- end
- def build_search_and_replace_method_for_modules_and_classes
- @f=nil
- @structure={}
- @arr={mod: [], cl: []}
- @files.each do |f|
- @new,@matched,@empty1,@empty2=true,false,false,false
- file=File.open(f,'r')
- cont=file.readlines
- file.close
- cont.each do |t|
- if f != @f
- @f=f
- @mod=nil
- #puts "---\n#{@f}"
- @structure[@f]={}
- end
- if t =~/^\s*module\s+\S+/
- @mod=t.match(/^\s*module\s+(\S+)/)[1]
- #puts ' ' + @mod
- @arr[:mod] << @mod
- @structure[@f].store(@mod,[])
- #@structure[@f] = {@mod => []}
- end
- if t =~/^\s*class\s+\S+/
- cl=t.match(/^\s*class\s+(\S+)/)[1]
- #puts ' ' + cl
- @arr[:cl] << cl
- @structure[@f][@mod] << cl
- end
- end
- end
- puts 'number of modules: ' + @arr[:mod].length.to_s + ', unique: ' + @arr[:mod].uniq.length.to_s
- puts 'number of classes: ' + @arr[:cl].length.to_s + ', unique: ' + @arr[:cl].uniq.length.to_s
- method_modules_and_classes=[]
- method_modules_and_classes <<<<-WOK
-#module SiSU_MC
- class Extracted
- def modify
- WOK
- #% modules_and_classes
- method_modules_and_classes <<<<-WOK
- def modules_and_classes
- [
- WOK
- @structure.sort.each do |fl,modules|
- method_modules_and_classes << ' '*8 + "##% -- " + fl
- modules.sort.each do |mod,classes|
- method_modules_and_classes << ' '*8 + '# ' + "[/#{mod}/," + ' '*(67 - mod.length) + "'#{mod}'],"
- classes.uniq.sort.each do |cl|
- method_modules_and_classes << ' '*8 + '# ' + "[/#{cl}/," + ' '*(65 - cl.length) + "'#{cl}'],"
- end
- end
- end
- method_modules_and_classes <<<<-WOK
- ]
- end
- WOK
- #% modules
- method_modules_and_classes <<<<-WOK
- def modules
- [
- WOK
- method_modules_and_classes << ' '*8 + '# ' + 'number of modules: ' + @arr[:mod].length.to_s +
- ', unique: ' + @arr[:mod].uniq.length.to_s
- @arr[:mod].uniq.sort.each do |mod|
- method_modules_and_classes << ' '*8 + '# ' + "[/#{mod}/," + ' '*(67 - mod.length) + "'#{mod}'],"
- end
- method_modules_and_classes <<<<-WOK
- ]
- end
- WOK
- #% classes
- method_modules_and_classes <<<<-WOK
- def classes
- [
- WOK
- method_modules_and_classes << ' '*8 + '# ' + 'number of classes: ' + @arr[:cl].length.to_s +
- ', unique: ' + @arr[:cl].uniq.length.to_s
- @arr[:cl].uniq.sort.each do |cl|
- method_modules_and_classes << ' '*8 + '# ' + "[/#{cl}/," + ' '*(67 - cl.length) + "'#{cl}'],"
- end
- method_modules_and_classes <<<<-WOK
- ]
- end
- WOK
- method_modules_and_classes <<<<-WOK
- self
- end
- end
-#end
- WOK
- #method_modules_and_classes.each{|x| puts x}
- if FileTest.file?(@modify_instructions_script) ==true
- message("WARNING << #{@mod_inst} >> exists (and may have been edited). The existing << #{@mod_inst} >> will be overwritten if you proceed.")
- end
- instructs=File.new(@modify_instructions_script,'w')
- method_modules_and_classes.each do |x|
- puts x
- instructs.puts x
- end
- instructs.close
- end
- def action
- if @files and @files.length > 0
- p @files
- mr=nil
- #%% changes to make m match, r replace -------------------------->
- if @cf =~/--help/; help
- else
- case @cf
- when /--convert/; convert
- when /--report/; report_modules_and_classes
- when /--build-gsub/; build_search_and_replace_method_for_modules_and_classes
- else help
- end
- #act
- end
- else puts "this routine makes permanent changes to the contents of the files matched, as instructed within [no matches]"
- end
- end
- end
-end
-#% files to match for this conversion set ------------------------->
-f=$* #; p $*
-cf=f[0].to_s
-f.shift
-match_and_replace=Array.new
-unless f.length > 0
- f=if cf == '--report' \
- or cf == '--build-gsub'
- Dir.glob("[a-zA-Z]*.rb") #restrict to ruby files
- else
- Dir.glob("[a-zA-Z]*")
- end
- f=f.sort.delete_if { |x| x == __FILE__ or x == 'modify_instructions.rb' }
-end
-SiSU_Modify::Operations.new(cf,f).action
-__END__
-#f=Dir.glob("{bin,conf,data,lib}/**/*.rb") #sisu development
-#f=Dir.glob("[^_]/**/*") #all files subdirectories beneath pwd except those starting with _
diff --git a/data/sisu/v4/conf/convert/sisu_convert b/data/sisu/v4/conf/convert/sisu_convert
deleted file mode 100644
index a3a12189..00000000
--- a/data/sisu/v4/conf/convert/sisu_convert
+++ /dev/null
@@ -1,519 +0,0 @@
-#!/usr/bin/env ruby
-# = sisu - SiSU information Structuring Universe
-#
-# Copyright (c) Ralph Amissah 1997,2004
-#
-# Ralph Amissah mailto:ralph@amissah.com
-#
-# * Name: SiSU information Structuring Universe
-# * Author: Ralph@Amissah.com
-# * Description: document conversion tool, to sisu from other formats
-# * License: GPL 3 or later
-# * Notes: word conversion uses wvWare and wvSiSU.xml (a modified/stripped wvHtml.xml)
-# * http://wvware.sourceforge.net/
-# * http://sourceforge.net/projects/wvware
-# * <url:sisu.lnk>|sisu.lnk|@|^|
-# * <url:sisu>
-module CONVERT
- class MyOutput
- def initialize(data, filename, instruct)
- @data=data.compact
- @filename=filename
- @instruct=instruct
- end
- def headerBasic
- <<WOK
-% SiSU 2.0
-
-@title:
- :subtitle:
-
-@creator:
- :author:
-
-@classify:
- :topic_register:
-
-@date:
- :published:
-
-@rights:
- :copyright:
- :license:
-
-WOK
- end
- def headerDefault
- <<WOK
-% SiSU 2.0
-
-@title:
- :subtitle:
-
-@creator:
- :author:
-
-@classify:
- :topic_register:
-
-@date:
- :published:
-
-@rights:
- :copyright:
- :license:
-
-WOK
- end
- def hardOutput
- pre = Array.new
- case @instruct
- when /default/
- pre << headerDefault
- else
- pre << headerBasic
- end
- @filename_wv=File.new(%{,,#{@filename}.sst},'w+')
- @filename_wv << pre
- @data.each do |x|
- y = x.split("\n")
- y.each do |z| # cleaner output this way
- z.strip!
- @filename_wv.puts "#{z}\n\n" unless z =~/^$/
- end
- end
- end
- end
- class WareWord97
- def initialize(data, filename, instruct)
- @data=data
- @filename=filename
- @instruct=instruct
- end
- def songsheet
- data=@data
- print "Convert to SiSU file from Word97 << gvim ,,#{@filename}.sst >\n" #: <<#{@@html_title}>>
- data=WareWord97.new(data.collect,@filename,@instruct).strip
- data=WareWord97.new(data.collect,@filename,@instruct).strip
- data=WareWord97.new(data.collect,@filename,@instruct).markup_rules
- data=MyOutput.new(data.collect,@filename,@instruct).hardOutput
- end
- def strip
- data=@data
- tuned_file=Array.new
- endnote_no=1
- data.each do |para|
- para.strip!
- para.gsub!(/<u>\s*<\/u>/,'')
- para.gsub!(/<\/u>\s*<u>/,'')
- para.gsub!(/<b>\s*<\/b>/,'')
- para.gsub!(/<\/b>\s*<b>/,'')
- para.gsub!(/<i>\s*<\/i>/,'')
- para.gsub!(/<\/i>\s*<i>/,'')
- tuned_file << para unless para == nil
- end
- tuned_file
- end
- def markup_rules
- data=@data
- tuned_file=Array.new
- endnote_no=1
- data.each do |para|
- para.strip!
- para.gsub!(/\s+/,' ')
- para.gsub!(/^<b>(Chapter|Article)(.+?)<\/b>/i,'1~ \1 \2') #watch case insensitivity
- para.gsub!(/^<b>(Part|Section|Book)(.+?)<\/b>/i,':C~ \1 \2') #watch case insensitivity
- para.gsub!(/^<b>(\d+\.\d+\.\d+\.?)(.+?)<\/b>/i,'3~ \1 \2') #numeric, decide what to do, can be different
- para.gsub!(/^<b>(\d+\.\d+\.?)(.+?)<\/b>/i,'2~ \1 \2') #numeric, decide what to do, can be different
- para.gsub!(/^<b>(\d.+?)<\/b>/i,'4~ \1 \2') #numeric, decide what to do, can be different
- #para.gsub!(/^<b>([\d.]+?)<\/b>/i,'4~ \1 \2') #numeric, decide what to do, can be different
- para.gsub!(/<u>(.+?)<\/u>/,'_{\1}_')
- para.gsub!(/<b>(.+?)<\/b>/,'!{\1}!')
- para.gsub!(/<i>(.+?)<\/i>/,'/{\1}/')
- tuned_file << para unless para == nil
- end
- tuned_file
- end
- end
- class Html
- def initialize(data, filename, instruct)
- @data=data
- @filename=filename
- @instruct=instruct
- end
- def songsheet
- data=@data
- print "Convert to SiSU file from #{@filename}.html << gvim ,,#{@filename}.sst >\n" #: <<#{@@html_title}>>
- #data=Html.new(data.collect, @filename, @instruct).space_paragraphs
- #data=Html.new(data.split(''), @filename, @instruct).space_paragraphs
- data=Html.new(data.join.split(/\n\n+/), @filename, @instruct).space_paragraphs
- #data=Html.new(data.split("\n"), @filename, @instruct).space_paragraphs
- #data=Html.new(data.collect.join.split("\n"), @filename, @instruct).space_paragraphs
- data=Html.new(data.collect, @filename, @instruct).multiline
- data=Html.new(data.collect.join.split("\n\n"), @filename, @instruct).markup_rules
- data=MyOutput.new(data.collect, @filename, @instruct).hardOutput
- end
- def space_paragraphs
- #data=@data.join.split(/\n/)
- data=@data
- #p data.length
- tuned_file=Array.new
- data.each do |para|
- para.strip!
- para.gsub!(/\r/,'')
- #para.gsub!(/\n/, ' ') #PROBLEM, serious time issues on a few files also for \n (or multiline matches which is less surprising), edit out if necessary
- para.gsub!(/<\/?p>/i,'zZz')
- para.gsub!(/<\/?\s*p(?:\s+ALIGN=.+?)?>/i,'zZz') #all manner of <p> para.gsub!(/<\/?p>/i, "\n\n")
- para.gsub!(/<p\s+(class|align).+?>/i,'zZz') #
- para.gsub!(/<\/p>/i,'zZz') # repeat actually
- para.gsub!(/<(?:dir|tr|br)>/i,'zZz') #
- #para.gsub!(/<(?:\/\s*)?(?:dir|tr|br)>/i, "zZz") #
- para.gsub!(/(<\/center>)/i,'\1zZz')
- para.gsub!(/(<\/h[1-6]>)/i,'\1zZz')
- para.gsub!(/ \s+/i,' ')
- para.gsub!(/(?:\s*zZz\s*)+/i,'zZz') #
- tuned_file << para unless para == nil
- end
- tuned_file
- end
- def blockquotes(sub='') # SERIOUS PROBLEM INTRODUCED, some blockquotes go missing !, quite unacceptable, debug, for now not used
- res=Array.new
- sub.each do |x|
- if x=~/(<\/blockquote>)/i
- m = $1
- res << x[/(.+?)#{m}/mi,1].gsub!(/zZz/,'zZz_1 ') if x =~/.+?#{m}/mi
- res << x[/#{m}(.+)/mi,1]
- else
- res << x #[/(.+)/mi,1]
- end
- end
- res.join
- end
- def multiline
- data=@data
- tuned_file=Array.new
- data.each do |para|
- para.gsub!(/\n/,' ')
- para.gsub!(/ \s+/mi,' ')
- #ALL HERE could be very time EXPENSIVE but tamed? compromise ... /mi
- para.gsub!(/<([biu]|h[1-6])>(?:zZz)?([^<]+)?zZz(.+?)<\/\1>/i,'zZz<\1>\2 \3</\1>')
- para.gsub!(/<([biu]|h[1-6])>(?:<center>|zZz)+(.+?)(?:<\/center>)?zZz(.+?)?<\/\1>/i,'zZz<\1>\2 \3</\1>')
- #para.gsub!(/<([biu]|h[1-6])>(?:<center>|zZz)+(.+?)<\/center>zZz(.+?)?<\/\1>/i,'zZz<\1>\2 \3</\1>')
- para.gsub!(/<([biu]|h[1-6])>(?:<center>|zZz)+(.+?)<\/\1>/i,'zZz<\1>\2</\1>')
- para.gsub!(/<(h[1-6])>(.+?)(?:<center>|zZz)+<\/\1>/i,'zZz<\1>\2</\1>zZz') #does catch some h1, h2 etc, too expensive to have biu
- #para.gsub!(/<([biu]|h[1-6])>(.+?)(?:<center>|zZz)+<\/\1>/i,'zZz<\1>\2 \3</\1>') #may go too far? useful for h1 h2 etc, remove biu?
- #para.gsub!(/<([biu]|h[1-6])>([^<]+)?zZz(.+?)<\/\1>/i,'zZz<\1>\2 \3</\1>')
- #para.gsub!(/<([biu]|h[1-6])>([^<]+)?zZz(.+?)<\/\1>/i,'zZz<\1>\2 \3</\1>')
- ### SERIOUS PROBLEM INTRODUCED
- # sub = para.split(/<blockquote>/i)
- # para = blockquotes(sub) if sub.length > 0 #check was on >1 could have serious repercussions 2004w29
- para.gsub!(/zZz(\s*zZz)*/,"\n\n")
- tuned_file << para << "\n\n" unless para == nil
- end
- tuned_file
- end
- def markup_rules
- @@flag_blockquote=false
- data=@data
- tuned_file=Array.new
- data.each do |para|
- if para=~/<a href="(http:\/\/.+?)">/i
- #p para.grep(/<a href="(http:\/\/.+?)">/i)
- #m=$1
- #para.gsub!(/(?:&lt;\s*)?<a href="#{m}">#{m}<\/a>(?:\s*&gt;)?\.?/i, "#{m}")
- para.gsub!(/(?:&lt;\s*)?<a href="(http:\/\/.+?)">http:\/\/.+?<\/a>(?:\s*&gt;)?\.?/i,'\1') #risk that url & url are not to match
- #para.gsub!(/(?:&lt;\s*)?<a href="(\w+\.html)">(http:\/\/.+?\/\1)<\/a>(?:\s*&gt;)?\.?/i, "\\2") #does not match
- end
- if para=~/<BLOCKQUOTE>/i
- @@flag_blockquote=true
- end
- if @@flag_blockquote
- para.gsub!(/^/,'_1 ') unless para.empty? or para =~/^\s*<\/?blockquote?>\s*$/i
- end
- if para=~/<\/BLOCKQUOTE>/i
- @@flag_blockquote=false
- end
- para.gsub!(/<\/?blockquote?>/i,'')
- ### clean
- para.gsub!(/^\s+/i,'')
- para.gsub!(/<([bui]|em|su[pb])>\s*<\/\1>/i,'')
- para.gsub!(/<\/?center>/i,'')
- para.gsub!(/\s*<\/dir>/i,'')
- para.gsub!(/<hr>/i,'')
- para.gsub!(/\s*<a href=".+?\.html#(?:[a-z_]+)?(?:[a-z0-9_-]|\*)+">\[(\*+)\]<\/a>/i,'^{[\1]}^ ') #other endnote marker
- para.gsub!(/<a href=".+?\.html#(?:[a-z_$]+)?[0-9_-]+"(?:\s+name=".+?")?>\[[a-z]?\d+\](?:<\/[bi]>)?<\/a>/i,'~^ ') #endnote marker
- para.gsub!(/<a name=".+?"\s+href=".+?\.html#(?:[a-z_$]+)?[0-9_-]+"?>\[[a-z]?\d+\](?:<\/[bi]>)?<\/a>/i,'~^ ') #endnote marker
- para.gsub!(/<a name="(?:[a-z$]+)?[0-9_-]+">\s*(<\/a>)?\s*\d+\.?\s*(<\/a>)?\s*/i,'^~ ') #endnote
- #para.gsub!(/<h([1-6])>\s*(.+?)\s*<\/h\1>\s*/i,'\1~ \2') #
- para.gsub!(/<h([1-6])(?: align=.+?)?>\s*(.+?)\s*<\/h\1>\s*/i,'\1~ \2') #
- para.gsub!(/^<b>(Chapter|Article)(.+?)<\/b>/i,'4~ \1 \2') #watch case insensitivity
- para.gsub!(/^<b>(Part|Section|Book)(.+?)<\/b>/i,'3~ \1 \2') #watch case insensitivity
- para.gsub!(/^<b>(\d+\.\d+\.\d+\.?)(.+?)<\/b>/i,'6~ \1 \2') #numeric, decide what to do, can be different
- para.gsub!(/^<b>(\d+\.\d+\.?)(.+?)<\/b>/i,'5~ \1 \2') #numeric, decide what to do, can be different
- para.gsub!(/^<b>(\d+\.?)(.+?)<\/b>/i,'4~ \1 \2') #numeric, decide what to do, can be different
- #<a name="ii"></a><B>
- para.gsub!(/^(<a name=".+?">)(?:<small>)?<(?:b|strong)>\s*(.+?)\s*<\/(?:b|strong)>/i,'5~ \2 \1') #watch
- para.gsub!(/^(<(a name|A NAME)=".+?">)(\s*|<\/[aA]>)?([A-Z][A-Z])+/,'5~ \2 \1') #watch
- para.gsub!(/^(\s+|<p>)?(<a name=".+?">)(\s*|<\/a>)?<b>/i,'5~ \2 \1') #watch
- para.gsub!(/<h([1-6])>\s*(.+?)\s*<\/h\1>\s*/i,'\1~ \2') #
- para.gsub!(/^<b>\s*(.+?)<\/b>\s*(<\/i>\s*)?$/i,'4~ \1\2') # wish it all were less messy
- para.gsub!(/^<i>\s*([^"(].+?)<\/i>\s*(<\/b>\s*)?$/i,'5~ \1\2') # wish it all were less messy
- para.gsub!(/<\/?[biu]>/i,'') if para =~/[1-6]\{/
- para.gsub!(/<u>\s*(.+?)\s*<\/u>/i,'_{\1}_')
- para.gsub!(/<(b|strong)>\s*(.+?)\s*<\/\1>/i,'*{\2}*')
- para.gsub!(/<(i|em)>\s*(.+?)\s*<\/\1>/i,'/{\2}/')
- para.gsub!(/<sup>\s*(.+?)\s*<\/sup>/i,'^{\1}^')
- para.gsub!(/(([\/\*!_])\{.+?\}\2)\s\s+/i,'\1 ')
- para.gsub!(/(([\/\*!_])\{.+?\}\2)\s+([.,;?\)])\s+/i,'\1\3 ')
- para.gsub!(/(([\/\*!_])\{.+?\}\2)(["'])\s+/i,'\1\3 ')
- para.gsub!(/(([\/\*!_])\{.+?\}\2)\s*([a-z0-9])/i,'\1 \3')
- para.gsub!(/(([\/\*_])\{.+?\}\2)\s*([a-z0-9])/i,'\1 \3')
- para.gsub!(/([a-z0-9])(([\/\*_])\{.+?\}\3)/i,' \1 \2') #eg this/{problem}/
- para.gsub!(/([\/\*_])\{([,.;; ]+)\}\1/i,'\2') #eg /{,}/ or *{ }* etc.
- para.gsub!(/ \s+/i,' ')
- #para.gsub!(/\/\{\*\{/i, '*{/{')
- #para.gsub!(/\}\*\}\//i, '}/}*')
- para.gsub!(/&quot;/i,'"')
- para.gsub!(/&amp;/i,'and')
- para.gsub!(/<!doctype html public .+/i,'')
- para.gsub!(/<\/?(?:html|head|body|font|small)>/i,'')
- para.gsub!(/<\/(?:title)>/i,'')
- para.gsub!(/<title>/i,'#{~title? ')
- para.gsub!(/<blockquote>(.+?)<\/blockquote>/mi,"\n\n_1 \\1\n\n")
- para.gsub!(/<div align=.+?>|<\/div>|<font size=.+?>|<\/a><\/em><\/strong>/i,'')
- para.gsub!(/~^\s+\.\s*/i,'.~^ ') #check vim equiv # %s/\~e\s\+\.\s*/.\~e /c
- para.gsub!(/\s+~^\s+/i,'~^ ')
- para.gsub!(/ \s+/i,' ')
- para.gsub!(/\s+$/i,'')
- para.gsub!(/^(?:<\/[bi]>)+$/i,'')
- para.gsub!(/^(?:(?:<i>)+<b>|(?:<b>)+<i>)\s*([^"(].+?)/i,'5~ \1\2') # wish it all were less messy
- para.gsub!(/^(?:<\/?(?:[ib]|em)>\s*)+$/i,'') # cleaning up left over <i> etc.
- para.gsub!(/<(?:i|em)>\s*(.+)/i,'/{\1}/') # using up left over <i>
- para.gsub!(/<b>\s*(.+)/i,'*{\1}*') # using up left over <b>
- para.gsub!(/<dd>([\d.]+)/i,'5~ \1')
- para.gsub!(/<dd>(?:&nbsp;)+([\d.]+)/i,'6~ \1')
- para.gsub!(/<dd>(\([a-z]\))/i,'7~ \1')
- para.gsub!(/^([1-9]~)( .+?)<a name="(\S+?)">(.+?)(<\/a>)/i,'\1\3\2\4')
- para.gsub!(/^([1-9]~)( .+?)<a name="(\S+?)">/i,'\1\3\2')
- para.gsub!(/http\/\/(\S+)/i,'http:\/\/\1')
- para.gsub!(/\s*<a href="\S+?">(http:\/\/\S+?)<\/a>\s*/i,' \1 ')
- para.gsub!(/([a-zA-Z.,!?;:])([*\/_-]\{)/,'\1 \2')
- para.gsub!(/^\s*(&nbsp;){10,12}/i,'_2 ')
- para.gsub!(/^\s*(&nbsp;){4,5}/i,'_1 ')
- para.gsub!(/&#9;/,' ') #check
- ## glyphs & tildes
- para.gsub!(/&iexcl;/, '¡') #'Inverted exclamation
- para.gsub!(/&cent;/, '¢') #'Cent sign ¢
- para.gsub!(/&pound;/, '£') #'Pound sign £
- para.gsub!(/&curren;/, '¤') #'General currency sign
- para.gsub!(/&yen;/, '¥') #'Yen sign ¥
- para.gsub!(/&brvbar;/, '¦') #'Broken vertical bar
- para.gsub!(/&sect;/, '§') #'Section sign §
- para.gsub!(/&uml;/, '¨') #'Umlaut
- para.gsub!(/&copy;/, '©') #'Copyright ©
- para.gsub!(/&ordf;/, 'ª') #'Feminine ordinal ª
- para.gsub!(/&laquo;/, '«') #'Left angle quote «
- para.gsub!(/&not;/, '¬') #'Not sign
- para.gsub!(/&shy;/, '­') #'Soft hyphen
- para.gsub!(/&reg;/, '®') #'Registered trademark ®
- para.gsub!(/&macr;/, '¯') #'Macron accent
- para.gsub!(/&deg;/, '°') #'Degree sign °
- para.gsub!(/&plusmin;/,'±') #'Plus or minus ±
- para.gsub!(/&sup2;/, '²') #'Superscript 2 ²
- para.gsub!(/&sup3;/, '³') #'Superscript 3 ³
- para.gsub!(/&acute;/, '') #'Acute accent
- para.gsub!(/&micro;/, 'µ') #'Micro sign (Greek mu) µ
- para.gsub!(/&para;/, '¶') #'Paragraph sign ¶
- para.gsub!(/&middot;/, '·') #'Middle dot
- para.gsub!(/&cedil;/, '¸') #'Cedilla
- para.gsub!(/&sup1;/, '¹') #'Superscript 1 ¹
- para.gsub!(/&ordm;/, 'º') #'Masculine ordinal º
- para.gsub!(/&raquo;/, '»') #'Right angle quote
- para.gsub!(/&frac14;/, '¼') #'Fraction one quarter ¼
- para.gsub!(/&frac12;/, '½') #'Fraction on half ½
- para.gsub!(/&frac34;/, '¾') #'Fraction three quarters ¾
- para.gsub!(/&iquest;/, '¿') #'Inverted question mark ¿
- para.gsub!(/&Agrave;/, 'À') #'Capital A, grave accent À
- para.gsub!(/&Aacute;/, 'Á') #'Capital A, acute accent Á
- para.gsub!(/&Acirc;/, 'Â') #'Capital A, circumflex accent Â
- para.gsub!(/&Atilde;/, 'Ã') #'Capital A, tilde Ã
- para.gsub!(/&Auml;/, 'Ä') #'Capital A, umlaut Ä
- para.gsub!(/&Aring;/, 'Å') #'Capital A, ring Å
- para.gsub!(/&AElig;/, 'Æ') #'Capital AE ligature Æ
- para.gsub!(/&Ccedil;/, 'Ç') #'Capital C, cedilla Ç
- para.gsub!(/&Egrave;/, 'È') #'Capital E, grave accent È
- para.gsub!(/&Eacute;/, 'É') #'Capital E, acute accent É
- para.gsub!(/&Ecirc;/, 'Ê') #'Capital E, circumflex accent Ê
- para.gsub!(/&Euml;/, 'Ë') #'Capital E, umlaut Ë
- para.gsub!(/&Igrave;/, 'Ì') #'Capital I, grave accent Ì
- para.gsub!(/&Iacute;/, 'Í') #'Capital I, acute accent Í
- para.gsub!(/&Icirc;/, 'Î') #'Capital I, circumflex accent Î
- para.gsub!(/&Iuml;/, 'Ï') #'Capital I, umlaut Ï
- para.gsub!(/&ETH;/, 'Ð') #'Capital eth, Icelandic
- para.gsub!(/&Ntilde;/, 'Ñ') #'Capital N, tilde Ñ
- para.gsub!(/&Ograve;/, 'Ò') #'Capital O, grave accent Ò
- para.gsub!(/&Oacute;/, 'Ó') #'Capital O, acute accent Ó
- para.gsub!(/&Ocirc;/, 'Ô') #'Capital O, circumflex accent Ô
- para.gsub!(/&Otilde;/, 'Õ') #'Capital O, tilde Õ
- para.gsub!(/&Ouml;/, 'Ö') #'Capital O, umlaut Ö
- para.gsub!(/&times;/, '×') #'Multiply sign ×
- para.gsub!(/&Oslash;/, 'Ø') #'Capital O, slash Ø
- para.gsub!(/&Ugrave;/, 'Ù') #'Capital U, grave accent Ù
- para.gsub!(/&Uacute;/, 'Ú') #'Capital U, acute accent Ú
- para.gsub!(/&Ucirc;/, 'Û') #'Capital U, circumflex accent Û
- para.gsub!(/&Uuml;/, 'Ü') #'Capital U, umlaut Ü
- para.gsub!(/&Yacute;/, 'Ý') #'Capital Y, acute accent Ý
- para.gsub!(/&THORN;/, 'Þ') #'Capital thorn, Icelandic Þ
- para.gsub!(/&szlig;/, 'ß') #'Small sz ligature, German ß
- para.gsub!(/&agrave;/, 'à') #'Small a, grave accent à
- para.gsub!(/&aacute;/, 'á') #'Small a, acute accent á
- para.gsub!(/&acirc;/, 'â') #'Small a, circumflex accent â
- para.gsub!(/&atilde;/, 'ã') #'Small a, tilde ã
- para.gsub!(/&auml;/, 'ä') #'Small a, umlaut ä
- para.gsub!(/&aring;/, 'å') #'Small a, ring å
- para.gsub!(/&aelig;/, 'æ') #'Small ae ligature æ
- para.gsub!(/&ccedil;/, 'ç') #'Small c, cedilla ç
- para.gsub!(/&egrave;/, 'è') #'Small e, grave accent è
- para.gsub!(/&eacute;/, 'é') #'Small e, acute accent é
- para.gsub!(/&ecirc;/, 'ê') #'Small e, circumflex accent ê
- para.gsub!(/&euml;/, 'ë') #'Small e, umlaut ë
- para.gsub!(/&igrave;/, 'ì') #'Small i, grave accent ì
- para.gsub!(/&iacute;/, 'í') #'Small i, acute accent í
- para.gsub!(/&icirc;/, 'î') #'Small i, circumflex accent î
- para.gsub!(/&iuml;/, 'ï') #'Small i, umlaut ï
- para.gsub!(/&eth;/, 'ð') #'Small eth, Icelandic ð
- para.gsub!(/&ntilde;/, 'ñ') #'Small n, tilde ñ
- para.gsub!(/&ograve;/, 'ò') #'Small o, grave accent ò
- para.gsub!(/&oacute;/, 'ó') #'Small o, acute accent ó
- para.gsub!(/&ocirc;/, 'ô') #'Small o, circumflex accent ô
- para.gsub!(/&otilde;/, 'õ') #'Small o, tilde õ
- para.gsub!(/&ouml;/, 'ö') #'Small o, umlaut ö
- para.gsub!(/&divide;/, '÷') #'Divide sign ÷
- para.gsub!(/&oslash;/, 'ø') #'Small o, slash ø
- para.gsub!(/&ugrave;/, 'ù') #'Small u, grave accent ù
- para.gsub!(/&uacute;/, 'ú') #'Small u, acute accent ú
- para.gsub!(/&ucirc;/, 'û') #'Small u, circumflex accent û
- para.gsub!(/&uuml;/, 'ü') #'Small u, umlaut ü
- para.gsub!(/&yacute;/, 'ý') #'Small y, acute accent ý
- para.gsub!(/&thorn;/, 'þ') #'Small thorn, Icelandic þ
- para.gsub!(/&yuml;/, 'ÿ') #'Smally y, umlaut ÿ
- ##
- para.gsub!(/\s\s+/,' ')
- para.gsub!(/\t+/,' ')
- #para.gsub!(/ +/,' ')
- #para.gsub!(/^(?:<(?:\/)?[bi]>)+$/i, '')
- tuned_file << para unless para == nil
- end
- tuned_file
- end
- end
- class Default < Html
- def initialize(data, filename, instruct)
- @data=data
- @filename=filename
- @instruct=instruct
- end
- def songsheet
- data=@data
- print "Convert to SiSU file from #{@filename}.html << gvim ,,#{@filename}.sst >\n" #: <<#{@@html_title}>>
- data=Default.new(data.collect, @filename, @instruct).space_paragraphs
- data=Default.new(data.collect, @filename, @instruct).multiline
- data=Default.new(data.collect.join.split("\n\n"), @filename, @instruct).markup_rules
- data=Default.new(data.collect, @filename, @instruct).markup_default
- data=MyOutput.new(data.collect, @filename, @instruct).hardOutput
- end
- def markup_default
- data=@data
- tuned_file=Array.new
- data.each do |para|
- para.gsub!(/<i>(Id\.?)(\s|$)/i,'/\{\1\}\2/')
- para.gsub!(/^(~\{\{ .+?)(<\/LI>\s*|<\/OL>\s*)+$/i,'\1')
- para.gsub!(/\/\{Id\.\s*<\/LI>\s*\}\//i,'/{Id.}/')
- tuned_file << para unless para == nil
- end
- tuned_file
- end
- end
-end
-def help
- puts <<WOK
-conversion program
-initial SiSU markup from other file formats
-
- zxy_convert --word does initial conversion from word97 to sisu markup, expects [filename].doc (can also use --doc)
- zxy_convert --html does initial conversion from html to sisu markup, expects [filename].html
- zxy_convert --default does initial conversion from defalt html to sisu markup, expects [filename].html
-
-WOK
-end
-def do_word(argv, instruct)
- argv.each do |f|
- if f =~/.+?\.doc$/
- @argv << f[/(.+?)\.doc$/, 1]
- else
- print "not .doc? << #{f} >> "
- end
- end
- @argv.each do |filename|
- system(%{wvWare -x #{@dir.path.home}/.sisu/convert/wvSiSU.xml #{filename}.doc > #{filename}.wv})
- file_array=IO.readlines("#{filename}.wv", "")
- CONVERT::WareWord97.new(file_array, filename, instruct).songsheet # metaverse created here
- end
-end
-def do_html(argv, instruct)
- argv.each do |f|
- if f =~/.+?\.html?$/
- @argv << f[/(.+?)\.html?$/, 1]
- else
- print "not .html? << #{f} >> "
- end
- end
- @argv.each do |filename|
- file_end=if FileTest.file?("#{filename}.html")
- 'html'
- elsif FileTest.file?("#{filename}.htm")
- 'htm'
- end
- file_array=IO.readlines("#{filename}.#{file_end}","\n\r")
- CONVERT::Html.new(file_array,filename,instruct).songsheet # metaverse created here
- end
-end
-def do_default(argv, instruct)
- argv.each do |f|
- if f =~/.+?\.html$/
- @argv << f[/(.+?)\.html$/, 1]
- else
- print "not .html? << #{f} >> "
- end
- end
- @argv.each do |filename|
- file_array=IO.readlines("#{filename}.html", "\n\r")
- CONVERT::Default.new(file_array, filename, instruct).songsheet # metaverse created here
- end
-end
-def cases(argv, instruct)
- case instruct
- when/^--(word(97)?|doc)$/i #creates minimal sisu_small.gz package to send
- do_word(argv, instruct)
- when/^--(html)$/i #creates sisu.gz package to send
- do_html(argv, instruct)
- when/^--(default)$/i #creates sisu.gz package to send
- do_default(argv, instruct)
- else
- help
- end
-end
-$KCODE='u'
-branch='v2'
-@argv=Array.new
-argv=$*
-SiSU_version_dir=(argv.inspect=~/--v1/) ? 'v1' : 'v2'
-SiSU_lib="sisu/#{SiSU_version_dir}"
-require "#{SiSU_lib}/sysenv"
-include SiSU_Env
-@dir=SiSU_Env::Info_env.new
-instruct = "#{argv[0].to_s}"
-argv.shift
-instruct.chomp!
-instruct = "help" if instruct.nil? or instruct == "";
-cases(argv, instruct)
diff --git a/data/sisu/v4/conf/convert/wvHtml.xml b/data/sisu/v4/conf/convert/wvHtml.xml
deleted file mode 100644
index 3cc9dd29..00000000
--- a/data/sisu/v4/conf/convert/wvHtml.xml
+++ /dev/null
@@ -1,388 +0,0 @@
-<main>
-<charentity>
-<begin>HTML</begin>
-</charentity>
-
-<document>
-<begin>&lt;!DOCTYPE HTML PUBLIC &quot;-//W3C//DTD HTML 4.0 Transitional//EN&quot; &quot;http://www.w3.org/TR/REC-html40/loose.dtd&quot;&gt;
-&lt;html&gt;
-&lt;head&gt;
-&lt;META HTTP-EQUIV=&quot;Content-Type&quot; CONTENT=&quot;text/html; charset=<charset/>&quot;&gt;
-&lt;META NAME=&quot;GENERATOR&quot; CONTENT=&quot;wvWare/<version/>&quot;&gt;
-&lt;title&gt;
-<title/>
-&lt;/title&gt;
-&lt;/head&gt;
-&lt;body bgcolor=&quot;#FFFFFF&quot; text=&quot;#000000&quot; link=&quot;#0000ee&quot; vlink=&quot;#551a8b&quot;&gt;
-</begin>
-<end>
-&lt;!--
-&lt;hr&gt;
-&lt;address&gt;
-&lt;a href=&quot;http://wvware.sourceforge.net/&quot;&gt;&lt;img
-src=&quot;wvSmall.gif&quot; height=31 width=47
-align=left border=0 alt=&quot;wvWare&quot;&gt;&lt;/a&gt;
-&lt;a href=&quot;http://validator.w3.org/check/referer&quot;&gt;&lt;img
-src=&quot;vh40.gif&quot; height=31 width=88
-align=right border=0 alt=&quot;Valid HTML 4.0!&quot;&gt;&lt;/a&gt;
-Document created with &lt;a href=&quot;http://wvware.sourceforge.net/&quot;&gt;wvWare/<version/>&lt;/a&gt;&lt;br&gt;
-&lt;/address&gt;
---&gt;
-&lt;/body&gt;
-&lt;/html&gt;
-</end>
-</document>
-
-<section>
-<begin>
-&lt;!--Section Begins--&gt;&lt;br&gt;
-</begin>
-<end>
-&lt;!--Section Ends--&gt;
-</end>
-</section>
-
-<justification>
-<left>left</left>
-<right>right</right>
-<center>center</center>
-<block>left</block>
-<asian>&lt;!--Could Someone who sees this tag tell me what was is this type of justification, asian languages only i thing--&gt;</asian>
-</justification>
-
-<numbering>
-<Arabic>type=&quot;1&quot;</Arabic>
-<UpperRoman>type=&quot;I&quot;</UpperRoman>
-<LowerRoman>type=&quot;i&quot;</LowerRoman>
-<UpperCaseN>type=&quot;A&quot;</UpperCaseN>
-<LowerCaseN>type=&quot;a&quot;</LowerCaseN>
-</numbering>
-
-<border>
-<noned>none</noned>
-<singled>solid</singled>
-<thickd>solid</thickd>
-<doubled>double</doubled>
-<number4d>double</number4d>
-<hairlined>solid</hairlined>
-<dotd>dotted</dotd>
-<dashlargegapd>dashed</dashlargegapd>
-<dotdashd>dotted</dotdashd>
-<dotdotdashd>dotted</dotdotdashd>
-<tripled>double</tripled>
-<thin-thicksmallgapd>dashed</thin-thicksmallgapd>
-<thick-thinsmallgapd>dashed</thick-thinsmallgapd>
-<thin-thick-thinsmallgapd>dashed</thin-thick-thinsmallgapd>
-<thin-thickmediumgapd>dashed</thin-thickmediumgapd>
-<thick-thinmediumgapd>dashed</thick-thinmediumgapd>
-<thin-thick-thinmediumgapd>dashed</thin-thick-thinmediumgapd>
-<thin-thicklargegapd>dashed</thin-thicklargegapd>
-<thick-thinlargegapd>dashed</thick-thinlargegapd>
-<thin-thick-thinlargegapd>dashed</thin-thick-thinlargegapd>
-<waved>solid</waved>
-<doublewaved>double</doublewaved>
-<dashsmallgapd>sashed</dashsmallgapd>
-<dashdotstrokedd>dashed</dashdotstrokedd>
-<emboss3Dd>ridge</emboss3Dd>
-<engrave3Dd>groove</engrave3Dd>
-<defaultd>ridge</defaultd>
-</border>
-
-<!-- <begin>&lt;ol <nfc/> start=&quot;<start/>&quot;&gt; -->
-<olist>
-<begin>&lt;ol <nfc/>&gt;
-</begin>
-<end>&lt;/ol&gt;</end>
-</olist>
-
-<ulist>
-<begin>&lt;ul&gt;
-</begin>
-<end>&lt;/ul&gt;</end>
-</ulist>
-
-<!-- <begin>&lt;li&gt;</begin> -->
-<entry>
-<begin>&lt;li value=&quot;<start/>&quot;&gt;</begin>
-<end>&lt;/li&gt;</end>
-</entry>
-
-
-<!--
-this tableoverride option can be used to turn off handling of
-these tags in tables, which I find is necessary for at least netscape
--->
-<tableoverrides>
-<ParaBefore>0</ParaBefore>
-<ParaRight>0</ParaRight>
-<ParaAfter>0</ParaAfter>
-<ParaLeft>0</ParaLeft>
-<ParaLeft1>0</ParaLeft1>
-<VertMergedCells>0</VertMergedCells>
-</tableoverrides>
-
-<table>
-<begin>&lt;table width=&quot;<tablerelwidth/>%&quot; border=&quot;1&quot; cols=&quot;<no_cols/>&quot; rows=&quot;<no_rows/>&quot;&gt;</begin>
-<end>&lt;/table&gt;</end>
-</table>
-
-<row>
-<begin>&lt;tr&gt;</begin>
-<end>&lt;/tr&gt;</end>
-</row>
-
-<cell>
-<begin>&lt;td bgcolor=&quot;<cellbgcolor/>&quot; width=&quot;<cellrelwidth/>%&quot; rowspan=&quot;<rowspan/>&quot; colspan=&quot;<colspan/>&quot;&gt;</begin>
-<end>&lt;/td&gt;</end>
-</cell>
-
-<paragraph>
-<begin>
-<table.end/>
-<table.begin/>
-<row.begin/><cell.begin/><olist.end/><olist.begin/><ulist.end/><ulist.begin/><entry.begin/><text.begin/>
-</begin>
-<end>
-<text.end/><entry.end/><olist.end/><ulist.end/><cell.end/><row.end/>
-</end>
-</paragraph>
-
-<!-- these are all the character properties that can show up in word -->
-<bold><begin>&lt;b&gt;</begin><end>&lt;/b&gt;</end></bold>
-<italic><begin>&lt;i&gt;</begin><end>&lt;/i&gt;</end></italic>
-
-<!--
-text that has been deleted and will be displayed with strikethrough when
-revision marked text is to be displayed
-
-use either this line...
--->
-<RMarkDel><begin>&lt;s&gt;</begin><end>&lt;/s&gt;&lt;a href=&quot;#author<ibstRMarkDel/>&quot;&gt;[Author ID<ibstRMarkDel/>: at <dttmRMarkDel/> ]&lt;/a&gt;</end></RMarkDel>
-
-<!--
-or uncomment below to make deleted text dissappear (well, become commented out)
--->
-<!--
-<RMarkDel><begin>&lt;!-&#45;</begin><end>-&#45;&gt;</end></RMarkDel>
--->
-
-<!-- Overwriting char props. like CaPs->CAPS SmallCaps->smallcaps -->
-<outline><begin></begin><end></end></outline>
-<smallcaps><begin>&lt;span style=&quot;text-transform:lowercase&quot;&gt;</begin><end>&lt;/span&gt;</end></smallcaps>
-<caps><begin>&lt;span style=&quot;text-transform:uppercase&quot;&gt;</begin><end>&lt;/span&gt;</end></caps>
-<vanish><begin></begin><end></end></vanish>
-
-<!--If you uncomment this then the annotation text links will become commented out by html tags-->
-<!--
-<vanish><begin>&lt;!-&#45;</begin><end>-&#45;&gt;</end></vanish>
--->
-
-<!--
-text that has been newly typed since the last time revision marks have been accepted
-and will be displayed with underline when revision marked text is to be displayed
-
-use either this line...
--->
-<RMark><begin>&lt;u&gt;</begin><end>&lt;/u&gt;&lt;a href=&quot;#author<ibstRMark/>&quot;&gt;[Author ID<ibstRMark/>: at <dttmRMark/>]&lt;/a&gt;</end></RMark>
-
-<!--
-or uncomment below to make the underline dissappear
--->
-<!--
-<RMark><begin></begin><end></end></RMark>
--->
-
-
-<strike><begin>&lt;s&gt;</begin><end>&lt;/s&gt;</end></strike>
-<shadow><begin></begin><end></end></shadow>
-<lowercase><begin></begin><end></end></lowercase>
-<emboss><begin></begin><end></end></emboss>
-<imprint><begin></begin><end></end></imprint>
-<!--double strike-->
-<dstrike><begin>&lt;s&gt;</begin><end>&lt;/s&gt;</end></dstrike>
-
-<!--
-ftc's
-&
-hps
-
-keep them for font face and do that later.
--->
-
-<super><begin>&lt;sup&gt;</begin><end>&lt;/sup&gt;</end></super>
-<sub><begin>&lt;sub&gt;</begin><end>&lt;/sub&gt;</end></sub>
-
-<singleu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></singleu>
-<wordu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></wordu>
-<doubleu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></doubleu>
-<dottedu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dottedu>
-<hiddenu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></hiddenu>
-<thicku><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></thicku>
-<dashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dashu>
-<dotu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotu>
-<dotdashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotdashu>
-<dotdotdashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotdotdashu>
-<waveu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></waveu>
-
-<!--
-text whose properties have been changed since the last time revision marks have been accepted
-and will be displayed with a note showing the change points.
-
-use either this line (which admit it a bit scary looking, but harmless)...
--->
-<PropRMark><begin>&lt;a href=&quot;#author<ibstPropRMark/>&quot;&gt;-&#45;&amp;gt;&lt;/a&gt;</begin><end>&lt;a href=&quot;#author<ibstPropRMark/>&quot;&gt;[Author ID<ibstPropRMark/>: at <dttmPropRMark/>]&lt;/a&gt;</end></PropRMark>
-
-<!--
-or uncomment below to make the notes dissappear
--->
-<!--
-<PropRMark><begin></begin><end></end></PropRMark>
--->
-
-<!--
-<color>
--->
-<Black><begin>Black</begin><end></end></Black>
-<Blue><begin>Blue</begin><end></end></Blue>
-<Cyan><begin>Cyan</begin><end></end></Cyan>
-<Green><begin>Green</begin><end></end></Green>
-<Magenta><begin>Magenta</begin><end></end></Magenta>
-<Red><begin>Red</begin><end></end></Red>
-<Yellow><begin>Yellow</begin><end></end></Yellow>
-<White><begin>White</begin><end></end></White>
-<DkBlue><begin>DarkBlue</begin><end></end></DkBlue>
-<DkCyan><begin>DarkCyan</begin><end></end></DkCyan>
-<DkGreen><begin>DarkGreen</begin><end></end></DkGreen>
-<DkMagenta><begin>DarkMagenta</begin><end></end></DkMagenta>
-<DkRed><begin>DarkRed</begin><end></end></DkRed>
-<DkYellow><begin>#8b8b00</begin><end></end></DkYellow>
-<DkGray><begin>DarkGray</begin><end></end></DkGray>
-<LtGray><begin>LightGrey</begin><end></end></LtGray>
-<!--
-</color>
--->
-
-<!--
-<animation>
--->
-<LasVegas><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></LasVegas>
-<BackgroundBlink><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></BackgroundBlink>
-<SparkleText><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></SparkleText>
-<MarchingAnts><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></MarchingAnts>
-<MarchingRedAnts><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></MarchingRedAnts>
-<Shimmer><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></Shimmer>
-<!--
-</animation>
--->
-
-<!--
-I dont understand what this one is, and ive never come across it
-
-use this sample line (which admit it a bit scary looking, but harmless)...
--->
-<DispFldRMark><begin>&lt;a href=&quot;#author<ibstDispFldRMark/>&quot;&gt;--&amp;gt;&lt;/a&gt;</begin><end>&lt;a href=&quot;#author<ibstDispFldRMark/>&quot;&gt;[Author ID<ibstDispFldRMark/>: at <dttmDispFldRMark/> (<xstDispFldRMark/>)]&lt;/a&gt;</end></DispFldRMark>
-
-<!--
-or uncomment below to ignore it, the previous might even crash wv ?
--->
-<!--
-<DispFldRMark><begin></begin><end></end></DispFldRMark>
--->
-
-<animation>
-<begin><LasVegas.begin/><BackgroundBlink.begin/><SparkleText.begin/><MarchingAnts.begin/><MarchingRedAnts.begin/><Shimmer.begin/></begin>
-<end><Shimmer.end/><MarchingRedAnts.end/><MarchingAnts.end/><SparkleText.end/><BackgroundBlink.end/><LasVegas.end/></end>
-</animation>
-
-<fontstr>
-<begin>&lt;font color=&quot;<black.begin/><blue.begin/><cyan.begin/><green.begin/><magenta.begin/><red.begin/><yellow.begin/><white.begin/><dkblue.begin/><dkcyan.begin/><dkgreen.begin/><dkmagenta.begin/><dkred.begin/><dkyellow.begin/><dkgray.begin/><ltgray.begin/>&quot;&gt;</begin>
-<end><ltgray.end/><dkgray.end/><dkyellow.end/><dkred.end/><dkmagenta.end/><dkgreen.end/><dkcyan.end/><dkblue.end/><white.end/><yellow.end/><red.end/><magenta.end/><green.end/><cyan.end/><blue.end/><black.end/>&lt;/font&gt;</end>
-</fontstr>
-
-<comment>
-<begin>
-&lt;a href=&quot;#comment<ibstAnno/> &quot;&gt;-&#45;&amp;gt;&lt;/a&gt;
-</begin>
-<end>&lt;a href=&quot;#comment<ibstAnno/> &quot;&gt;[Author:<xstUsrInitl/>]&lt;/a&gt;
-</end>
-</comment>
-
-<style name="Normal">
-<character>
-<begin><PropRMark.begin/><DispFldRMark.begin/><animation.begin/><fontstr.begin/><bold.begin/><italic.begin/><strike.begin/><RMarkDel.begin/><outline.begin/><smallcaps.begin/><caps.begin/><vanish.begin/><RMark.begin/><shadow.begin/><lowercase.begin/><emboss.begin/><imprint.begin/><dstrike.begin/><super.begin/><sub.begin/><singleu.begin/><wordu.begin/><doubleu.begin/><dottedu.begin/><hiddenu.begin/><thicku.begin/><dashu.begin/><dotu.begin/><dotdashu.begin/><dotdotdashu.begin/><waveu.begin/></begin>
-<end><waveu.end/><dotdotdashu.end/><dotdashu.end/><dotu.end/><dashu.end/><thicku.end/><hiddenu.end/><dottedu.end/><doubleu.end/><wordu.end/><singleu.end/><sub.end/><super.end/><dstrike.end/><imprint.end/><emboss.end/><lowercase.end/><shadow.end/><RMark.end/><vanish.end/><caps.end/><smallcaps.end/><outline.end/><RMarkDel.end/><strike.end/><italic.end/><bold.end/><fontstr.end/><animation.end/><DispFldRMark.end/><PropRMark.end/></end>
-</character>
-
-<!-- Netscape does handle this correctly yet, here is how each different side of the border should work.
-border-top: thin <bordertopstyle/> <bordertopcolor/>;
-border-left: thin <borderleftstyle/> <borderleftcolor/>;
-border-right: thin <borderrightstyle/> <borderrightcolor/>;
-border-bottom: thin <borderbottomstyle/> <borderbottomcolor/>
--->
-
-
-<pmargin>
-<begin>margin: <mmParaBefore/> <mmParaRight/> <mmParaAfter/> <mmParaLeft/>;</begin>
-</pmargin>
-
-<pborder>
-<begin>
-border: thin <borderleftstyle/> <borderleftcolor/>;
-<!--
-border-top: thin <bordertopstyle/> <bordertopcolor/>;
-border-left: thin <borderleftstyle/> <borderleftcolor/>;
-border-right: thin <borderrightstyle/> <borderrightcolor/>;
-border-bottom: thin <borderbottomstyle/> <borderbottomcolor/>
--->
-</begin>
-</pborder>
-
-<text>
-<begin>&lt;p&gt;&lt;div name=&quot;<stylename/>&quot; align=&quot;<just/>&quot; style=&quot;<paramargin/> <paraborder/> padding: <mmPadTop/> <mmPadRight/> <mmPadBottom/> <mmPadLeft/>; &quot;&gt;
-
-&lt;p style=&quot;text-indent: <mmParaLeft1/>; text-align: <just/>; line-height: <mmLineHeight/>; color: <parafgcolor/>; background-color: <parabgcolor/>; &quot;&gt;</begin>
-
-<end>&lt;/p&gt;&lt;/div&gt;</end>
-</text>
-
-<picture>
-<begin>
-&lt;img <htmlAlignGuess/> width=&quot;<pixPicWidth/>&quot; height=&quot;<pixPicHeight/>&quot; alt=&quot;0x01 graphic&quot; src=&quot;placeholder.png&quot;&gt;<htmlNextLineGuess/>
-</begin>
-</picture>
-
-</style>
-
-<!--we need to be override the character properties-->
-<!--
-<style name="Normal">
-<character>
-<begin><PropRMark.begin/><DispFldRMark.begin/><animation.begin/><fontstr.begin/><bold.begin/><italic.begin/><strike.begin/><RMarkDel.begin/><outline.begin/><smallcaps.begin/><caps.begin/><vanish.begin/><RMark.begin/><shadow.begin/><lowercase.begin/><emboss.begin/><imprint.begin/><dstrike.begin/><super.begin/><sub.begin/><singleu.begin/><wordu.begin/><doubleu.begin/><dottedu.begin/><hiddenu.begin/><thicku.begin/><dashu.begin/><dotu.begin/><dotdashu.begin/><dotdotdashu.begin/><waveu.begin/></begin>
-<end><waveu.end/><dotdotdashu.end/><dotdashu.end/><dotu.end/><dashu.end/><thicku.end/><hiddenu.end/><dottedu.end/><doubleu.end/><wordu.end/><singleu.end/><sub.end/><super.end/><dstrike.end/><imprint.end/><emboss.end/><lowercase.end/><shadow.end/><RMark.end/><vanish.end/><caps.end/><smallcaps.end/><outline.end/><RMarkDel.end/><strike.end/><italic.end/><bold.end/><fontstr.end/><animation.end/><DispFldRMark.end/><PropRMark.end/></end>
-</character>
-
-<text>
-<begin>&lt;div name=&quot;<stylename/>&quot; align=&quot;<just/>&quot;&gt;&lt;p&gt;</begin>
-<end>&lt;/p&gt;&lt;/div&gt;</end>
-</text>
-
-</style>
-
-<style name="Heading 1">
-
-<character>
-<begin></begin>
-<end></end>
-</character>
-
-<text>
-<begin>&lt;div name=&quot;<stylename/>&quot; align=&quot;<just/>&quot;&gt;&lt;H1&gt;</begin>
-<end>&lt;/H1&gt;&lt;/div&gt;</end>
-</text>
-
-
-
-</style>
--->
-
-</main>
diff --git a/data/sisu/v4/conf/convert/wvSiSU.xml b/data/sisu/v4/conf/convert/wvSiSU.xml
deleted file mode 100644
index 271b00ff..00000000
--- a/data/sisu/v4/conf/convert/wvSiSU.xml
+++ /dev/null
@@ -1,360 +0,0 @@
-<main>
-<charentity>
-<begin>HTML</begin>
-</charentity>
-<!-- wvWare -x wvSiSU.xml [inputfile.doc] [outputfile.html] -->
-
-<document>
-<begin>
-</begin>
-<end>
-</end>
-</document>
-
-<section>
-<begin>
-</begin>
-<end>
-</end>
-</section>
-
-<justification>
-<left>left</left>
-<right>right</right>
-<center>center</center>
-<block>left</block>
-<asian>&lt;!--Could Someone who sees this tag tell me what was is this type of justification, asian languages only i thing--&gt;</asian>
-</justification>
-
-<numbering>
-<Arabic>type=&quot;1&quot;</Arabic>
-<UpperRoman>type=&quot;I&quot;</UpperRoman>
-<LowerRoman>type=&quot;i&quot;</LowerRoman>
-<UpperCaseN>type=&quot;A&quot;</UpperCaseN>
-<LowerCaseN>type=&quot;a&quot;</LowerCaseN>
-</numbering>
-
-<border>
-<noned>none</noned>
-<singled>solid</singled>
-<thickd>solid</thickd>
-<doubled>double</doubled>
-<number4d>double</number4d>
-<hairlined>solid</hairlined>
-<dotd>dotted</dotd>
-<dashlargegapd>dashed</dashlargegapd>
-<dotdashd>dotted</dotdashd>
-<dotdotdashd>dotted</dotdotdashd>
-<tripled>double</tripled>
-<thin-thicksmallgapd>dashed</thin-thicksmallgapd>
-<thick-thinsmallgapd>dashed</thick-thinsmallgapd>
-<thin-thick-thinsmallgapd>dashed</thin-thick-thinsmallgapd>
-<thin-thickmediumgapd>dashed</thin-thickmediumgapd>
-<thick-thinmediumgapd>dashed</thick-thinmediumgapd>
-<thin-thick-thinmediumgapd>dashed</thin-thick-thinmediumgapd>
-<thin-thicklargegapd>dashed</thin-thicklargegapd>
-<thick-thinlargegapd>dashed</thick-thinlargegapd>
-<thin-thick-thinlargegapd>dashed</thin-thick-thinlargegapd>
-<waved>solid</waved>
-<doublewaved>double</doublewaved>
-<dashsmallgapd>sashed</dashsmallgapd>
-<dashdotstrokedd>dashed</dashdotstrokedd>
-<emboss3Dd>ridge</emboss3Dd>
-<engrave3Dd>groove</engrave3Dd>
-<defaultd>ridge</defaultd>
-</border>
-
-<!-- <begin>&lt;ol <nfc/> start=&quot;<start/>&quot;&gt; -->
-<olist>
-<begin>
-</begin>
-<end></end>
-</olist>
-
-<ulist>
-<begin>
-</begin>
-<end></end>
-</ulist>
-
-<!-- <begin>&lt;li&gt;</begin> -->
-<entry>
-<begin></begin>
-<end></end>
-</entry>
-
-
-<!--
-this tableoverride option can be used to turn off handling of
-these tags in tables, which I find is necessary for at least netscape
--->
-<tableoverrides>
-<ParaBefore>0</ParaBefore>
-<ParaRight>0</ParaRight>
-<ParaAfter>0</ParaAfter>
-<ParaLeft>0</ParaLeft>
-<ParaLeft1>0</ParaLeft1>
-<VertMergedCells>0</VertMergedCells>
-</tableoverrides>
-
-<table>
-<begin></begin>
-<end></end>
-</table>
-
-<row>
-<begin>&lt;tr&gt;</begin>
-<end>&lt;/tr&gt;</end>
-</row>
-
-<cell>
-<begin></begin>
-<end></end>
-</cell>
-
-<!-- EDITING OUT DID MUCH OF TRICK -->
-<paragraph>
-<begin>
-</begin>
-<end>
-</end>
-</paragraph>
-
-<!-- these are all the character properties that can show up in word -->
-<bold><begin>&lt;b&gt;</begin><end>&lt;/b&gt;</end></bold>
-<italic><begin>&lt;i&gt;</begin><end>&lt;/i&gt;</end></italic>
-
-<!--
-text that has been deleted and will be displayed with strikethrough when
-revision marked text is to be displayed
-
-use either this line...
--->
-<RMarkDel><begin>&lt;s&gt;</begin><end>&lt;/s&gt;&lt;a href=&quot;#author<ibstRMarkDel/>&quot;&gt;[Author ID<ibstRMarkDel/>: at <dttmRMarkDel/> ]&lt;/a&gt;</end></RMarkDel>
-
-<!--
-or uncomment below to make deleted text dissappear (well, become commented out)
--->
-<!--
-<RMarkDel><begin>&lt;!-&#45;</begin><end>-&#45;&gt;</end></RMarkDel>
--->
-
-<!-- Overwriting char props. like CaPs->CAPS SmallCaps->smallcaps -->
-<outline><begin></begin><end></end></outline>
-<smallcaps><begin></begin><end></end></smallcaps>
-<caps><begin></begin><end></end></caps>
-<vanish><begin></begin><end></end></vanish>
-
-<!--If you uncomment this then the annotation text links will become commented out by html tags-->
-<!--
-<vanish><begin>&lt;!-&#45;</begin><end>-&#45;&gt;</end></vanish>
--->
-
-<!--
-text that has been newly typed since the last time revision marks have been accepted
-and will be displayed with underline when revision marked text is to be displayed
-
-use either this line...
--->
-<RMark><begin></begin><end></end></RMark>
-
-<!--
-or uncomment below to make the underline dissappear
--->
-<!--
-<RMark><begin></begin><end></end></RMark>
--->
-
-
-<strike><begin>&lt;s&gt;</begin><end>&lt;/s&gt;</end></strike>
-<shadow><begin></begin><end></end></shadow>
-<lowercase><begin></begin><end></end></lowercase>
-<emboss><begin></begin><end></end></emboss>
-<imprint><begin></begin><end></end></imprint>
-<!--double strike-->
-<dstrike><begin>&lt;s&gt;</begin><end>&lt;/s&gt;</end></dstrike>
-
-<!--
-ftc's
-&
-hps
-
-keep them for font face and do that later.
--->
-
-<super><begin>&lt;sup&gt;</begin><end>&lt;/sup&gt;</end></super>
-<sub><begin>&lt;sub&gt;</begin><end>&lt;/sub&gt;</end></sub>
-
-<singleu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></singleu>
-<wordu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></wordu>
-<doubleu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></doubleu>
-<dottedu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dottedu>
-<hiddenu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></hiddenu>
-<thicku><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></thicku>
-<dashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dashu>
-<dotu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotu>
-<dotdashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotdashu>
-<dotdotdashu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></dotdotdashu>
-<waveu><begin>&lt;u&gt;</begin><end>&lt;/u&gt;</end></waveu>
-
-<!--
-text whose properties have been changed since the last time revision marks have been accepted
-and will be displayed with a note showing the change points.
-
-use either this line (which admit it a bit scary looking, but harmless)...
--->
-<PropRMark><begin></begin><end></end></PropRMark>
-
-<!--
-or uncomment below to make the notes dissappear
--->
-<!--
-<PropRMark><begin></begin><end></end></PropRMark>
--->
-
-<!--
-<color>
--->
-<Black><begin>Black</begin><end></end></Black>
-<Blue><begin>Blue</begin><end></end></Blue>
-<Cyan><begin>Cyan</begin><end></end></Cyan>
-<Green><begin>Green</begin><end></end></Green>
-<Magenta><begin>Magenta</begin><end></end></Magenta>
-<Red><begin>Red</begin><end></end></Red>
-<Yellow><begin>Yellow</begin><end></end></Yellow>
-<White><begin>White</begin><end></end></White>
-<DkBlue><begin>DarkBlue</begin><end></end></DkBlue>
-<DkCyan><begin>DarkCyan</begin><end></end></DkCyan>
-<DkGreen><begin>DarkGreen</begin><end></end></DkGreen>
-<DkMagenta><begin>DarkMagenta</begin><end></end></DkMagenta>
-<DkRed><begin>DarkRed</begin><end></end></DkRed>
-<DkYellow><begin>#8b8b00</begin><end></end></DkYellow>
-<DkGray><begin>DarkGray</begin><end></end></DkGray>
-<LtGray><begin>LightGrey</begin><end></end></LtGray>
-<!--
-</color>
--->
-
-<!--
-<animation>
--->
-<LasVegas><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></LasVegas>
-<BackgroundBlink><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></BackgroundBlink>
-<SparkleText><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></SparkleText>
-<MarchingAnts><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></MarchingAnts>
-<MarchingRedAnts><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></MarchingRedAnts>
-<Shimmer><begin>&lt;blink&gt;</begin><end>&lt;/blink&gt;</end></Shimmer>
-<!--
-</animation>
--->
-
-<!--
-I dont understand what this one is, and ive never come across it
-
-use this sample line (which admit it a bit scary looking, but harmless)...
--->
-<DispFldRMark><begin></begin><end></end></DispFldRMark>
-
-<!--
-or uncomment below to ignore it, the previous might even crash wv ?
--->
-<!--
-<DispFldRMark><begin></begin><end></end></DispFldRMark>
--->
-
-<animation>
-<begin></begin>
-<end></end>
-</animation>
-
-<fontstr>
-<begin></begin>
-<end></end>
-</fontstr>
-
-<comment>
-<begin>
-</begin>
-<end>
-</end>
-</comment>
-
-<style name="Normal">
-<character>
-<begin><bold.begin/><italic.begin/><strike.begin/><RMarkDel.begin/><outline.begin/><smallcaps.begin/><caps.begin/><vanish.begin/><RMark.begin/><shadow.begin/><lowercase.begin/><emboss.begin/><imprint.begin/><dstrike.begin/><super.begin/><sub.begin/><singleu.begin/><wordu.begin/><doubleu.begin/><dottedu.begin/><hiddenu.begin/><thicku.begin/><dashu.begin/><dotu.begin/><dotdashu.begin/><dotdotdashu.begin/><waveu.begin/></begin>
-<end><waveu.end/><dotdotdashu.end/><dotdashu.end/><dotu.end/><dashu.end/><thicku.end/><hiddenu.end/><dottedu.end/><doubleu.end/><wordu.end/><singleu.end/><sub.end/><super.end/><dstrike.end/><imprint.end/><emboss.end/><lowercase.end/><shadow.end/><RMark.end/><vanish.end/><caps.end/><smallcaps.end/><outline.end/><RMarkDel.end/><strike.end/><italic.end/><bold.end/></end>
-</character>
-
-<!-- KEEP
-<style name="Normal">
-<character>
-<begin><PropRMark.begin/><DispFldRMark.begin/><animation.begin/><fontstr.begin/><bold.begin/><italic.begin/><strike.begin/><RMarkDel.begin/><outline.begin/><smallcaps.begin/><caps.begin/><vanish.begin/><RMark.begin/><shadow.begin/><lowercase.begin/><emboss.begin/><imprint.begin/><dstrike.begin/><super.begin/><sub.begin/><singleu.begin/><wordu.begin/><doubleu.begin/><dottedu.begin/><hiddenu.begin/><thicku.begin/><dashu.begin/><dotu.begin/><dotdashu.begin/><dotdotdashu.begin/><waveu.begin/></begin>
-<end><waveu.end/><dotdotdashu.end/><dotdashu.end/><dotu.end/><dashu.end/><thicku.end/><hiddenu.end/><dottedu.end/><doubleu.end/><wordu.end/><singleu.end/><sub.end/><super.end/><dstrike.end/><imprint.end/><emboss.end/><lowercase.end/><shadow.end/><RMark.end/><vanish.end/><caps.end/><smallcaps.end/><outline.end/><RMarkDel.end/><strike.end/><italic.end/><bold.end/><fontstr.end/><animation.end/><DispFldRMark.end/><PropRMark.end/></end>
-</character>
--->
-
-<!-- Netscape does handle this correctly yet, here is how each different side of the border should work.
-border-top: thin <bordertopstyle/> <bordertopcolor/>;
-border-left: thin <borderleftstyle/> <borderleftcolor/>;
-border-right: thin <borderrightstyle/> <borderrightcolor/>;
-border-bottom: thin <borderbottomstyle/> <borderbottomcolor/>
--->
-
-
-<pmargin>
-<begin></begin>
-</pmargin>
-
-<pborder>
-<begin>
-</begin>
-</pborder>
-
-<text>
-<begin>
-
-<mmParaLeft1/></begin>
-
-<end></end>
-</text>
-
-<picture>
-<begin>
-</begin>
-</picture>
-
-</style>
-
-<!--we need to be override the character properties-->
-<!--
-<style name="Normal">
-<character>
-<begin><PropRMark.begin/><DispFldRMark.begin/><animation.begin/><fontstr.begin/><bold.begin/><italic.begin/><strike.begin/><RMarkDel.begin/><outline.begin/><smallcaps.begin/><caps.begin/><vanish.begin/><RMark.begin/><shadow.begin/><lowercase.begin/><emboss.begin/><imprint.begin/><dstrike.begin/><super.begin/><sub.begin/><singleu.begin/><wordu.begin/><doubleu.begin/><dottedu.begin/><hiddenu.begin/><thicku.begin/><dashu.begin/><dotu.begin/><dotdashu.begin/><dotdotdashu.begin/><waveu.begin/></begin>
-<end><waveu.end/><dotdotdashu.end/><dotdashu.end/><dotu.end/><dashu.end/><thicku.end/><hiddenu.end/><dottedu.end/><doubleu.end/><wordu.end/><singleu.end/><sub.end/><super.end/><dstrike.end/><imprint.end/><emboss.end/><lowercase.end/><shadow.end/><RMark.end/><vanish.end/><caps.end/><smallcaps.end/><outline.end/><RMarkDel.end/><strike.end/><italic.end/><bold.end/><fontstr.end/><animation.end/><DispFldRMark.end/><PropRMark.end/></end>
-</character>
-
-<text>
-<begin>&lt;div name=&quot;<stylename/>&quot; align=&quot;<just/>&quot;&gt;&lt;p&gt;</begin>
-<end>&lt;/p&gt;&lt;/div&gt;</end>
-</text>
-
-</style>
-
-<style name="Heading 1">
-
-<character>
-<begin></begin>
-<end></end>
-</character>
-
-<text>
-<begin>&lt;div name=&quot;<stylename/>&quot; align=&quot;<just/>&quot;&gt;&lt;H1&gt;</begin>
-<end>&lt;/H1&gt;&lt;/div&gt;</end>
-</text>
-
-
-
-</style>
--->
-
-</main>