diff options
author | Ralph Amissah <ralph.amissah@gmail.com> | 2007-06-02 11:27:06 +0100 |
---|---|---|
committer | Ralph Amissah <ralph.amissah@gmail.com> | 2007-06-02 11:27:06 +0100 |
commit | 26767cc88c0548ad7978021796d0ccc4c9f7ffed (patch) | |
tree | fe225e99e180b5d2925cbf776826f74db27e1888 /lib/sisu/0.52/sst_to_s_xml_dom.rb | |
parent | restrict use to ruby1.8 branch, i.e. < 1.9 (diff) |
0.53.0, pre-build, see changelog, library naming changed for scm, placed under v0 (instead of 0.53) [refs: upstream/0.53.0, sisu_0.53.0]
Diffstat (limited to 'lib/sisu/0.52/sst_to_s_xml_dom.rb')
-rw-r--r-- | lib/sisu/0.52/sst_to_s_xml_dom.rb | 563 |
1 files changed, 0 insertions, 563 deletions
# Source: diff --git a/lib/sisu/0.52/sst_to_s_xml_dom.rb b/lib/sisu/0.52/sst_to_s_xml_dom.rb
# (deleted file mode 100644, index 9665250b..00000000, hunk @@ -1,563 +0,0 @@)
=begin

 * Name: SiSU information Structuring Universe - Structured information, Serialized Units
 * Author: Ralph Amissah
   * http://www.jus.uio.no/sisu
   * http://www.jus.uio.no/sisu/SiSU/download.html

 * Description: simple xml representation (dom style)

 * Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007 Ralph Amissah

 * License: GPL 2 or later

   Summary of GPL 2

   This program is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by the Free
   Software Foundation; either version 2 of the License, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful, but WITHOUT
   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
   FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
   more details.

   You should have received a copy of the GNU General Public License along
   with this program; if not, write to the Free Software Foundation, Inc.,
   51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA

   If you have Internet connection, the latest version of the GPL should be
   available at these locations:
     http://www.fsf.org/licenses/gpl.html
     http://www.gnu.org/copyleft/gpl.html
     http://www.jus.uio.no/sisu/gpl2.fsf

   SiSU was first released to the public on January 4th 2005

   SiSU uses:

   * Standard SiSU markup syntax,
   * Standard SiSU meta-markup syntax, and the
   * Standard SiSU object citation numbering and system

   © Ralph Amissah 1997, current 2007.
   All Rights Reserved.

 * Ralph Amissah: ralph@amissah.com
   ralph.amissah@gmail.com

 * Notes: tidy -xml sax.xml >> index.tidy
=end
# Produces the "simple xml (dom style)" output: reads a document as blank-line
# separated paragraphs, emits nested <headingN>/<contentsN>/<content>/<object>
# elements and writes the result to the file named by md.fn[:sxd].
module SiSU_simple_xml_model_dom
  require SiSU_lib + '/defaults'
  require SiSU_lib + '/param'
  include SiSU_Param
  include SiSU_Viz
  require SiSU_lib + '/sysenv'
  include SiSU_Env
  require SiSU_lib + '/dal_doc_str'
  require SiSU_lib + '/shared_xml'
  require SiSU_lib + '/xml_format'
  include SiSU_XML_format
  include SiSU_XML_munge
  require SiSU_lib + '/rexml'
  include SiSU_Rexml
  @@alt_id_count,@@tablehead,@@number_of_cols=0,0,0
  @@tablefoot=''
  # Entry point: built with the command options object, #read drives one file.
  class Convert
    @@fns=nil
    # opt: options object; this class reads opt.cmd (flag string) and opt.fns (file name).
    def initialize(opt)
      @opt=opt
    end
    # Loads parameters and environment for @opt.fns, reports progress on screen
    # (unless the q flag is set), reads the paragraphs and hands them to Songsheet.
    # Any StandardError is passed to SiSU_Errors::Info_error instead of propagating.
    def read
      begin
        @md=SiSU_Param::Parameters.new(@opt).get #bug, relies on info persistence, assumes -m has previously been run
        @env=SiSU_Env::Info_env.new(@opt.fns)
        # path, loc and tool are computed but not used further in this method.
        path=@env.path.output_tell
        loc=@env.url.output_tell
        tool=if @opt.cmd =~/[MV]/; "#{Dir.pwd}/#{@md.fn[:sxd]}\n\t#{@env.program.xml_viewer} #{path}/#{@md.fnb}/#{@md.fn[:sxd]}"
        elsif @opt.cmd =~/v/; "#{@env.program.web_browser} #{Dir.pwd}/#{@md.fn[:sxd]}"
        else ''
        end
        SiSU_Screen::Ansi.new(@opt.cmd,'invert','XML DOM',"#{@md.fns} -> #{@md.fn[:sxd]}").colorize unless @opt.cmd =~/q/
        tell=SiSU_Screen::Ansi.new(@opt.cmd,@opt.fns,"#{Dir.pwd}/#{@md.fn[:sxd]}")
        tell.flow if @opt.cmd =~/[MV]/
        # The class-level paragraph cache is reset whenever the file name changes.
        # Nothing in this file ever fills it, so read_fnm is what actually runs.
        unless @@fns==@opt.fns
          @@fns=@opt.fns
          @@dal_array=[]
        end
        @dal_array=if @@dal_array.empty?; read_fnm
        else @@dal_array.dup # check
        end
        SiSU_simple_xml_model_dom::Convert::Songsheet.new(@dal_array,@md,@env).songsheet
      rescue; SiSU_Errors::Info_error.new($!,$@,@opt.cmd,@opt.fns).error
      ensure #file closed in songsheet
      end
    end
    # Reads @opt.fns from the current directory, split on blank lines ("\n\n").
    # Returns the array of paragraphs; when the file does not exist it prints
    # 'Error' and returns nil (the value of puts).
    def read_fnm
      dal=[]
      if FileTest.file?("#{Dir.pwd}/#{@opt.fns}")
        dal=IO.readlines("#{Dir.pwd}/#{@opt.fns}","\n\n")
      else puts 'Error'
      end
    end
    private
    # Runs the conversion (Scroll) and then the optional checks selected by md.cmd.
    class Songsheet
      # data: array of paragraphs; md: document parameters; dir: environment object.
      def initialize(data,md,dir)
        @data,@md,@env=data,md,dir
      end
      # Builds and writes the XML, then runs Tidy for the v/V/M flags and the
      # REXML parse for the M flag. Errors are reported via SiSU_Errors::Info_error.
      def songsheet
        begin
          SiSU_simple_xml_model_dom::Convert::Scroll.new(@data,@md).songsheet
          SiSU_simple_xml_model_dom::Convert::Tidy.new(@md,@env).xml if @md.cmd =~/[vVM]/ # test wellformedness, comment out when not in use
          SiSU_Rexml::Rexml.new(@md,@md.fn[:sxd]).xml if @md.cmd =~/M/ # test rexml parsing, comment out when not in use #debug
        rescue; SiSU_Errors::Info_error.new($!,$@,@md.cmd,@md.fns).error
        ensure
        end
      end
    end
    # Accumulates the XML document in the class-level @@xml hash
    # (:open, :head, :body, :close, ...) and publishes it through Output.
    class Scroll
      require SiSU_lib + '/shared_txt'
      require SiSU_lib + '/css'
      include SiSU_text_utils
      @@xml={ :body=>[],:open=>[],:close=>[],:head=>[] }
      # data: array of paragraphs; md: document parameters (may be nil, in which
      # case @env and @trans are left unset).
      def initialize(data='',md=nil)
        @data,@md=data,md
        @vz=SiSU_Env::Get_init.instance.skin
        # Capture 1: optional name following a heading marker; capture 2: the text.
        @regx=/^(?:(?:<:p[bn]>\s*)?(?::?[A-C]|\d~)(?:(\S+))?\s+)?(.+)/
        @tab="\t"
        if @md
          @env=SiSU_Env::Info_env.new(@md.fns)
          @trans=SiSU_XML_munge::Trans.new(@md)
        end
        @sys=SiSU_Env::System_call.new
      end
      # Full pipeline: document prologue, paragraph markup, epilogue, write-out.
      def songsheet
        pre
        markup
        post
        publish
      end
      protected
      # Rewrites ~{note}~ and ~[* note]~ / ~[+ note]~ endnotes in place as <endnote> elements.
      def embedded_endnotes(para='')
        para.gsub!(/~\{(.+?)\}~/,
          '<endnote><note>\1</note></endnote> ')
        para.gsub!(/~\[([*+])\s+(.+?)\]~/,
          '<endnote><symbol>\1</symbol><note>\2</note></endnote> ')
      end
      # Rewrites endnote markup in place: symbol forms first (~[* ..]~, ~{* ..}~),
      # then the plain ~{..}~ form.
      def xml_markup(para='')
        para.gsub!(/~\[([*+])\s+(.+?)\]~/,
          '<endnote><symbol>\1</symbol><note>\2</note></endnote> ')
        para.gsub!(/~\{([*+]+)\s+(.+?)\}~/,
          '<endnote><symbol>\1</symbol><note>\2</note></endnote> ')
        # This pattern has a single capture group, so the note text is \1;
        # the former \2 always produced an empty <note>.
        para.gsub!(/~\{(.+?)\}~/,
          '<endnote><note>\1</note></endnote> ')
      end
      # Appends one <header> element to the head section.
      # meta must respond to text, attrib and el; inline markup in the text is
      # converted to <i>/<b>/<u>/<del> first and ' & ' becomes ' and '.
      def xml_head(meta)
        txt=meta.text
        txt.gsub!(/\/{(.+?)}\//,'<i>\1</i>')
        txt.gsub!(/[*!]{(.+?)}[*!]/,'<b>\1</b>')
        txt.gsub!(/_{(.+?)}_/,'<u>\1</u>')
        txt.gsub!(/-{(.+?)}-/,'<del>\1</del>')
        txt.gsub!(/<br(?: \/)?>/,'<br />')
        txt.gsub!(/ & /,' and ')
        @@xml[:head] << <<WOK
#{@tab}<header class="#{meta.attrib}">
#{@tab*2}<#{meta.el}>
#{@tab*3}#{txt}
#{@tab*2}</#{meta.el}>
#{@tab}</header>
WOK
      end
      # Stores the <source_control> fragment (or '' when @md.sc_info is unset)
      # in @@xml[:sc]. The md argument is not used; @md is read instead.
      # NOTE(review): the leading whitespace inside this heredoc was lost in the
      # copy this was restored from; tab indentation is assumed - confirm.
      def xml_sc(md='')
        sc=if @md.sc_info
          <<WOK
#{@tab}<source_control>
#{@tab*2}<sc class="sourcefile">
#{@tab*3}#{@md.sc_filename}
#{@tab*2}</sc>
#{@tab*2}<sc class="number">
#{@tab*3}#{@md.sc_number}
#{@tab*2}</sc>
#{@tab*2}<sc class="date">
#{@tab*3}#{@md.sc_date}
#{@tab*2}</sc>
#{@tab}</source_control>
WOK
        else ''
        end
        @@xml[:sc]=sc
      end
      # Appends an opening structural tag followed by its <heading> object, then
      # records which <contentsN> element is now open (levels 4-6 only).
      # lv: heading level 1-6; para: paragraph (text taken from @regx capture 2);
      # xml_element: opening tag text; xml_content: text appended after </heading>.
      def xml_element(lv='',para='',hname='',tag='',xml_element='',xml_content='')
        lv=lv.to_i
        n=lv - 1
        n1=lv
        n2=lv + 1
        n3=lv + 2
        # NOTE(review): tag is rebuilt here but never written to the output below.
        tag=''
        tag="\n#{@tab*n3}<nametag>#{hname}</nametag>\n" if hname
        @@xml[:body] << <<WOK
#{@tab*n}#{xml_element}
#{@tab*n1}<heading>
#{@tab*n2}<object>
#{@tab*n3}<text>#{para[@regx,2]}</text>
#{@tab*n2}</object>
#{@tab*n1}</heading>#{xml_content}
WOK
        if lv == 4
          @copen[1]=true
          @copen[2]=@copen[3]=false
        elsif lv == 5
          @copen[2]=true
          @copen[3]=false
        elsif lv == 6
          @copen[3]=true
        end
      end
      # Emits </contentsN> from the highest currently open contents level down to
      # floor, each indented by indent tabs. Returns the highest open level, or
      # nil when none is open. Open flags are left untouched.
      def close_open_contents(floor,indent)
        top=[3,2,1].find { |c| @copen[c] }
        top.downto(floor) { |c| @@xml[:body] << "#{@tab*indent}</contents#{c}>\n" } if top
        top
      end
      # Closes whatever must be closed before a heading of level lv, then opens
      # the new element through xml_element and updates the @level flags.
      # Levels 1-3 map to <headingN>; levels 4-6 map to <contents1..3> plus <content>.
      def xml_structure(lv='',para='',hname='' )
        puts lv if @md.cmd =~/[VM]/
        lv=lv.to_i
        n=lv - 1
        n3=lv + 2
        tag=''
        tag="\n#{@tab*n3}<nametag>#{hname}</nametag>\n" if hname !=nil
        open_tag=''
        content_open=''
        case lv
        when 1..3
          open_tag="<heading#{lv}>"
          3.downto(lv) do |x|
            y=x - 1
            @@xml[:body] << "#{@tab*5}</content>\n" if @cont[1] or @cont[2] or @cont[3]
            @cont[1]=false if @cont[1]
            @cont[2]=false if @cont[2]
            @cont[3]=false if @cont[3]
            # Close every open <contentsN>; flags are reset only when something was open.
            @copen[1]=@copen[2]=@copen[3]=false if close_open_contents(1,n)
            @@xml[:body] << "#{@tab*y}</heading#{x}>\n" if @level[x]
            @level[x]=false
          end
        when 4..6
          6.downto(lv) { |x| @xml_contents_close[x]='' if @level[x] == true }
          cv=lv - 3
          open_tag="<contents#{cv}>"
          content_open="\n#{@tab*5}<content>"
          # A <content> is pending if any content flag at this depth or shallower is set.
          @@xml[:body] << "#{@tab*5}</content>\n" if (1..cv).any? { |c| @cont[c] }
          # Close open <contentsN> at this depth or deeper (shallower ones stay open).
          close_open_contents(cv,n)
          @cont[cv]=true
        end
        xml_element(lv,para,hname,tag,open_tag,content_open)
        @level[lv]=true
        ((lv+1)..6).each { |x| @level[x]=false }
      end
      # Shared emitter for group/verse/code blocks: strips the <:marker> and
      # <:marker-end> tags from para in place and appends an <object> holding
      # <text class="css_class">.
      def text_object(para,marker,css_class)
        para.gsub!(/<:#{marker}(?:-end)?>/,'')
        para.strip!
        @@xml[:body] << %{#{@tab*6}<object>} << "\n"
        @@xml[:body] << %{#{@tab*7}<text class="#{css_class}">#{@tab*1}\n}
        @@xml[:body] << %{#{@tab*8}#{para}#{@tab*1}\n}
        @@xml[:body] << %{#{@tab*7}</text>\n}
        @@xml[:body] << "#{@tab*6}</object>" << "\n"
      end
      # Emits a <:group> block as <text class="group">.
      def group_structure(para='')
        text_object(para,'group','group')
      end
      # Emits a <:verse> block as <text class="verse">.
      def poem_structure(para='')
        text_object(para,'verse','verse')
      end
      # Emits a <:code> block as <text class="code">.
      def code_structure(para='')
        text_object(para,'code','code')
      end
      # Emits an already converted table inside an unindented <object>.
      # Also resets @endnotes; the return value is that empty array.
      def table_structure(table='')
        @@xml[:body] << %{#{@tab*0}<object>} << "\n"
        @@xml[:body] << %{#{@tab*1}#{table}\n#{@tab*1}\n}
        @@xml[:body] << "#{@tab*0}</object>" << "\n"
        @endnotes=[]
      end
      # Escapes bare ampersands in each word, in place, leaving words that
      # already contain an entity (&...;) alone. Returns wordlist.
      def tidywords(wordlist)
        wordlist.each do |x|
          # The replacement must be the entity: replacing '&' with '&' did nothing.
          x.gsub!(/&/,'&amp;') unless x =~/&\S+;/
        end
      end
      # Walks every paragraph: header lines go to the head section, headings open
      # and close structure, other paragraphs become <object>/<text> entries.
      # Finishes by closing whatever structural elements are still open.
      def markup
        data=@data
        dir=SiSU_Env::Info_env.new(@md.fns)
        xml_sc(@md)
        @rcdc=false
        @level,@cont,@copen,@xml_contents_close=[],[],[],[]
        (0..6).each { |x| @cont[x]=@level[x]=false }
        (4..6).each { |x| @xml_contents_close[x]='' }
        data.each do |para|
          wordlist=para.scan(/\S+|\n/) #\n needed for tables, check though added 2005w17
          para=tidywords(wordlist).join(' ').strip
          para.gsub!(/<[-~]#>/,'')
          para.gsub!(/<br\/?>/,'<br />')
          para.gsub!(/<:pb>\s*/,'')
          para.gsub!(/\{(\S+?\.(?:png|jpg|gif)) .+?\}(?:(?:https?|ftp):\/\/\S+|image)/,
            "<image.path>#{dir.url.images_local}/\\1</image.path>")
          # NOTE(review): as written this replaces a space with a space; the pattern
          # was probably an entity or non-breaking space before it was decoded - confirm.
          para.gsub!(/ /,' ')
          para=SiSU_document_structure::Structure.new(@md,para).structure
          @trans.char_enc.utf8(para) if @sys.locale =~/utf-?8/i #% utf8
          if para =~/\A(?:@|0~)(\S+?):?\s+(.+?)\Z/m
            d_meta=SiSU_text_utils::Header_scan.new(@md,para).meta
            if d_meta; xml_head(d_meta)
            end
          end
          # Once the metadata / document information section starts, body output stops.
          @rcdc=true if @rcdc==false and (para =~/~metadata/ or para =~/^1~\s+Document Information/)
          if para !~/(^0~|^@\S+?:|<ENDNOTES>|<EOF>)/
            @sto=SiSU_text_parts::Split_text_object.new(@md,para).lev_segname_para
            unless @rcdc
              if para !~/^(?:%\s|0~|@\S+?:)/
                format_scroll=SiSU_XML_format::Format_scroll.new(@md,@sto.text) if @sto.format =~/i[12]|null/
                case @sto.format
                when /^([1-6])~(\S+)?/
                  # Headings 1-6 share one path; only the heading_bodyN accessor differs.
                  level,name=$1,$2
                  xml_markup(para)
                  xml_structure(level,para,name)
                  para=@sto.lev_para_ocn.send("heading_body#{level}")
                else
                  # Other formats (i1, i2, center, bold, null) have no dedicated
                  # handling and are dispatched on the markers found in the text.
                  if para =~ /<:verse>/
                    poem_structure(para)
                  elsif para =~ /<:group>/
                    group_structure(para)
                  elsif para =~ /<:code>/
                    # NOTE(review): both substitutions are no-ops as written; they look
                    # like '<' / '>' escaping whose entities were decoded - confirm.
                    para.gsub!(/</,'<')
                    para.gsub!(/>/,'>')
                    code_structure(para)
                  elsif para =~/<!Th?.+/ # tables come as single block #work area 2005w13
                    table=SiSU_Tables::Table_xml.new(para)
                    para=table.table_split
                    # table_structure appends to the body itself; its return value
                    # (an empty array) is not body content, so it is not appended.
                    table_structure(para)
                  else #xml_structure
                    xml_markup(para)
                    @@xml[:body] << %{#{@tab*6}<object>} << "\n" if para[@regx] and para[@regx,2]
                    @@xml[:body] << "#{@tab*7}<text>#{para[@regx,2]}</text>\n" if para[@regx,2] # main text, contents, body KEEP
                    @@xml[:body] << "#{@tab*6}</object>" << "\n" if para[@regx]
                  end
                end
              elsif para =~/(Note|Endnotes?)/
              elsif para =~/(MetaData)/ and para =~/<~\d+;[m]\d+;\w\d+><#{@@dp}:#{@@dp}>$/ #debug 2003w46 add rc info
                format_scroll=Format_scroll.new(@md,'<br /><a name="metadata">MetaData</a>')
                para=format_scroll.bold_para
              elsif para =~/(Owner Details)/ and para !~/<~\d+;(?:\w|[0-6]:)\d+;\w\d+><#{@@dp}:#{@@dp}>$/
                format_scroll=Format_scroll.new(@md,'<br /><a name="owner.details">Owner Details</a>')
                @@xml[:owner_details]=format_scroll.bold_para
                para=''
              elsif para =~/(.*)<:#>(.*)/
                one,two=$1,$2
                format_text=Format_text_object.new(one,two)
                para=format_text.seg_no_paranum
              end
              para='' if para =~/<a name="n\d+">/ and para =~/^(-\{{2}~\d+|<!e[:_]\d+!>)/ # -endnote
              if para =~/.*<:#>.*$/
                para=case para
                when /<:i1>/, /<:i2>/
                  format_text=Format_text_object.new(para,'')
                  format_text.scr_inden_ocn_e_no_paranum
                else para # keep the text; without this para became nil and gsub! below raised
                end
              end
              if para !~/#{@vz.margin_txt_0}|#{@vz.margin_txt_1}|#{@vz.margin_txt_2}/ # where condition for no paranum
              end
              if para =~/<:center>/
                one,two=/(.*)<:center>(.*)/.match(para)[1,2]
                format_text=Format_text_object.new(one,two)
                para=format_text.center
              end
            else
            end
            para.gsub!(/<:\S+?>/,'')
            para.gsub!(/<!.+!>/,' ')
          end
        end
        # Close what is still open: the innermost open contents level also closes
        # the pending <content>, then the enclosing contents and headings follow.
        @content_flag=true
        6.downto(4) do |x|
          y=x - 1; v=x - 3
          if @level[x] == true
            if @content_flag==true
              @@xml[:body] << "#{@tab*5}</content>\n#{@tab*y}</contents#{v}>\n"
              @content_flag=false
            else
              @@xml[:body] << "\n#{@tab*y}</contents#{v}>\n"
            end
          end
        end
        3.downto(1) do |x|
          y=x - 1
          @@xml[:body] << "#{@tab*y}</heading#{x}>\n" if @level[x] == true
        end
        #6.downto(1) { |x| y=x - 1; @@xml[:body] << "#{@tab*y}</level #{x}>\n" if @level[x] == true }
      end
      # Resets head and body and writes the prologue: XML declaration (UTF-8 when
      # the locale says so, ISO-8859-1 otherwise), stylesheet PI, RDF comment, <document>.
      def pre
        rdf=SiSU_XML_tags::RDF.new(@md)
        dir=SiSU_Env::Info_env.new
        @@xml[:head],@@xml[:body]=[],[]
        css=SiSU_Env::CSS_select.new(@md).xml_sax
        encoding=if @sys.locale =~/utf-?8/i; '<?xml version="1.0" encoding="UTF-8" standalone="no"?>'
        else '<?xml version="1.0" encoding="ISO-8859-1" standalone="no"?>'
        end
        @@xml[:open] =<<WOK
#{encoding}
<?xml-stylesheet type="text/css" href="../#{dir.path.style}/#{css}"?>
#{rdf.comment_xml_dom}
<document>
WOK
        @@xml[:head] << "<head>\n"
        @@xml[:body] << "<body>\n"
      end
      # Appends the source-control fragment and the closing head/body/document tags.
      def post
        @@xml[:head] << @@xml[:sc]
        @@xml[:head] << "</head>\n"
        @@xml[:body] << "</body>\n"
        @@xml[:close] = "</document>\n"
      end
      # Concatenates the sections in document order, writes them through Output
      # and clears @@xml. Owner details are included only when @md.stmp matches /\w\w/.
      def publish
        content=[]
        data=@data
        content << @@xml[:open] << @@xml[:head] << @@xml[:body] << @@xml[:metadata]
        content << @@xml[:owner_details] if @md.stmp =~/\w\w/
        content << @@xml[:tail] << @@xml[:close]
        # join flattens nested arrays and renders nil as '', which is what
        # Array#to_s did on Ruby 1.8; on later Rubies to_s returns inspect output.
        Output.new(content.join,@md).xml
        @@xml={}
      end
    end
    # Final inline-markup pass and file writer.
    class Output
      include SiSU_Param
      include SiSU_Env
      # data: the whole document as one String; md: document parameters.
      def initialize(data,md)
        @data,@md=data,md
      end
      # Converts the remaining inline markup line by line, drops leftover <:..>
      # and <!..!> markers and empty lines, then writes the lines to the file
      # returned by SiSU_file#mkfile_pwd.
      def xml
        @sisu=[]
        # each_line gives the same iteration as 1.8's String#each and exists on later Rubies too.
        @data.each_line do |para|
          para.gsub!(/\/\{(.+?)\}\//,'<italic>\1</italic>')
          para.gsub!(/\*\{(.+?)\}\*/,'<bold>\1</bold>')
          para.gsub!(/!\{(.+?)\}!/,'<bold>\1</bold>')
          para.gsub!(/_\{(.+?)\}_/,'<underscore>\1</underscore>')
          para.gsub!(/-\{(.+?)\}-/,'<strike>\1</strike>')
          # do { links }http://url
          para.gsub!(/<:\S+?>/,'')
          para.gsub!(/<!.+?!>/,'')
          para="#{para}\n" unless para.empty?
          @sisu << para
        end
        new_file_data=@sisu.join
        @sisu=new_file_data.scan(/.+/) # keeps non-empty lines only
        SiSU_Env::SiSU_file.new(@md).mkdir
        filename_sxm=SiSU_Env::SiSU_file.new(@md,@md.fn[:sxd]).mkfile_pwd
        if filename_sxm.class == File
          @sisu.each {|para| filename_sxm.puts para}
          filename_sxm.close
        else puts 'file not created, is directory writable?'
        end
      end
    end
    # Optional well-formedness check of the generated file.
    class Tidy
      # md: document parameters; dir: environment object (stored, not used in #xml).
      def initialize(md,dir)
        @md,@env=md,dir
        @prog=SiSU_Env::Info_program.new
      end
      # For the V or M flags, and only when @prog.tidy is not false, runs
      # System_call#well_formed? on the generated file with /dev/null as the
      # second argument; screen messages are skipped when the q flag is set.
      def xml
        if @prog.tidy !=false #note values can be other than true
          if @md.cmd =~/[VM]/
            tell=SiSU_Screen::Ansi.new(@md.cmd,'invert','Using XML Tidy','check document structure')
            tell.colorize unless @md.cmd =~/q/
            tell.grey_open unless @md.cmd =~/q/
            tidyfile='/dev/null' #don't want one or screen output, check for alternative flags
            tidy =SiSU_Env::System_call.new("#{Dir.pwd}/#{@md.fn[:sxd]}",tidyfile)
            tidy.well_formed?
            tell.p_off unless @md.cmd =~/q/
          end
        end
      end
    end
  end
end
__END__