From 306aed5b8a559aad2fb944a946ffdda9713f07ec Mon Sep 17 00:00:00 2001 From: Ralph Amissah Date: Sat, 6 Mar 2010 09:47:55 -0500 Subject: introducing version 2, major patch, (version 1 libraries retained) --- lib/sisu/v2/html_segments.rb | 517 +++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 517 insertions(+) create mode 100644 lib/sisu/v2/html_segments.rb (limited to 'lib/sisu/v2/html_segments.rb') diff --git a/lib/sisu/v2/html_segments.rb b/lib/sisu/v2/html_segments.rb new file mode 100644 index 00000000..79aa699e --- /dev/null +++ b/lib/sisu/v2/html_segments.rb @@ -0,0 +1,517 @@ +# coding: utf-8 +=begin + + * Name: SiSU + + * Description: a framework for document structuring, publishing and search + + * Author: Ralph Amissah + + * Copyright: (C) 1997 - 2010, Ralph Amissah, All Rights Reserved. + + * License: GPL 3 or later: + + SiSU, a framework for document structuring, publishing and search + + Copyright (C) Ralph Amissah + + This program is free software: you can redistribute it and/or modify it + under the terms of the GNU General Public License as published by the Free + Software Foundation, either version 3 of the License, or (at your option) + any later version. + + This program is distributed in the hope that it will be useful, but WITHOUT + ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for + more details. + + You should have received a copy of the GNU General Public License along with + this program. If not, see . + + If you have Internet connection, the latest version of the GPL should be + available at these locations: + + + + + + + + * SiSU uses: + * Standard SiSU markup syntax, + * Standard SiSU meta-markup syntax, and the + * Standard SiSU object citation numbering and system + + * Hompages: + + + + * Download: + + + * Ralph Amissah + + + + ** Description: html segment generation, processing + +=end +module SiSU_HTML_seg + require "#{SiSU_lib}/shared_html" # shared_html.rb + require "#{SiSU_lib}/html" # html.rb + require "#{SiSU_lib}/html_promo" # html_promo.rb + require "#{SiSU_lib}/shared_metadata" # shared_metadata.rb + class Seg_output + def initialize(md,outputfile,seg,minitoc,type='') + @md,@output_seg_file,@seg,@minitoc,@type=md,outputfile,seg,minitoc,type + end + def output + if @seg[:title] =~/\S/ + filename_seg=[] + filename_seg << @seg[:title] << @seg[:tocband_banner] + if @type=='endnotes' + @seg[:headings]=[] + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + @seg[:headings] << format_head_seg.title_banner(@md.title.main,@md.title.sub,@author) + txt_obj={:txt =>'Endnotes',:ocn_display =>''} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @seg[:headings] << format_seg.title_heading1 + filename_seg << @seg[:heading_endnotes] << @minitoc << @seg[:headings] << %{\n
\n} << @seg[:endnote_all] << '
' # << '' + elsif @type=='idx' + @seg[:headings]=[] + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + @seg[:headings] << format_head_seg.title_banner(@md.title.main,@md.title.sub,@author) + txt_obj={:txt =>'Index',:ocn_display =>''} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @seg[:headings] << format_seg.title_heading1 + filename_seg << @seg[:heading_idx] << @minitoc << @seg[:headings] << %{\n
\n} << @seg[:idx] << '
' # << '' + elsif @type=='metadata' + metadata=Metadata::Summary.new(@md).xhtml_display.metadata + @seg[:headings]=[] + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + @seg[:headings] << format_head_seg.title_banner(@md.title.main,@md.title.sub,@author) + txt_obj={:txt =>'Metadata',:ocn_display =>''} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @seg[:headings] << format_seg.title_heading1 + filename_seg << @seg[:heading_idx] << @minitoc << @seg[:headings] << %{\n
\n} << metadata << '
' # << '' + else + filename_seg << @minitoc << @seg[:headings] << @seg[:main] << "\n\n" + end + filename_seg << @seg[:tail] << @seg[:tocband_bannerless] << @seg[:credits] + filename_seg.flatten!.compact! + filename_seg.each do |str| + unless str =~/\A\s*\Z/ + str.strip! + @output_seg_file << str + end + end + @output_seg_file.close + end + end + end + class Seg + @@seg,@@seg_subtoc,@@seg_endnotes,@@seg_ad={},{},{},{} + @@seg_name,@@seg_name_html=[],[] + @@seg_url=@@fn=@@get_hash_to=@@get_hash_fn='' + @@loop_count=@@seg_total=@@tracker=0 + @@is4=@@is3=@@is2=@@is1=0 + @@heading1=@@heading2=@@heading3=@@heading4=0 + @@seg[:tocband_banner],@@seg[:tocband_bannerless],@@seg[:title],@@seg[:headings],@@seg[:main],@@seg[:idx],@@seg[:tail],@@seg[:credits],@@seg_subtoc_array,@@seg_endnotes_array,@@seg[:endnote_all]=Array.new(11){[]} + @@seg[:heading_endnotes]='' + @@tablehead,@@number_of_cols=0,0 + @@dp,@@segtocband=nil,nil + @@fns_previous='' + attr_reader :seg_name_html,:seg_name_html_tracker + def initialize(md='',data='') + @md,@data=md,data + @vz=SiSU_Env::Get_init.instance.skin + @seg_name_html=@@seg_name_html || nil + @seg_name_html_tracker=@@tracker || nil + end + def songsheet + begin + @minitoc=SiSU_HTML::Source::Toc.new(@md,@data).minitoc + data=get_subtoc_endnotes(@data) + data=articles(data) + Seg.new.cleanup # (((( added )))) + #### (((( END )))) #### + rescue; SiSU_Errors::Info_error.new($!,$@,@md.cmd,@md.fns).error + ensure + @@seg_name=[] + end + end + protected + def articles(data) + track,tracking,newfile=0,0,0 + @@is4=@@is3=@@is2=@@is1=0 + printed_endnote_seg='n' + idx_html=nil + if @md.book_idx + my_make_source_file=SiSU_Env::Create_file.new(@md.cmd,@md.fns) + idx_html=SiSU_Particulars::Combined_singleton.instance.get_idx_html(@md.opt).html_idx + idx_html.each {|x| @@seg[:idx] << x } + @@seg[:heading_idx]='' + end + data.each do |dob| + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==4 + @@seg_name << dob.name + seg_name=dob.name + end + end + @@seg_name_html=@@seg_name + @@seg_total=@@seg_name.length + testforartnum=@@seg_name_html + tell=SiSU_Screen::Ansi.new(@md.cmd,@@seg_name.length) + tell.segmented unless @md.cmd =~/q/ + map_nametags=SiSU_Particulars::Combined_singleton.instance.get_map_nametags(@md).nametags_map #p map_nametags + data.each do |dob| + if defined? dob.obj \ + and dob.obj =~/href="#{Xx[:segment]}#(\S+?)"/ + m=$1 + dob.obj.gsub!(/href="#{Xx[:segment]}#(\S+?)"/,%{href="#{map_nametags[m][:segname]}#{Sfx[:html]}#\\1"}) + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==4 + if dob.ocn==0 + @@heading4=dob.obj + else @@heading4=dob.obj + end + @@is4=newfile=1 + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==3 + @@heading3=dob.obj + @@is4,@@is3=0,1 + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==2 + @@heading2=dob.obj + @@is4,@@is3,@@is2=0,0,1 + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==1 + @@heading1=dob.obj + @@is4,@@is3,@@is2,@@is1=0,0,0,1 + end + if (@@is1 && !@@is2 && !@@is3 && !@@is4) + if not (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==1 + head1=$_ #; check + end + end + if @@is4==1 + if newfile==1 \ + or dob.obj =~/^#{Mx[:br_endnotes]}|^#{Mx[:br_eof]}/ + newfile=0 + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==4 + if tracking != 0 + mkdir_p(@md.dir_out) unless FileTest.directory?(@md.dir_out) #bug - added specifically for nav! not needed by regular seg, check !!! + Seg.new(@md).tail + segfilename="#{@md.dir_out}/#{@md.fnl[:pre]}#{@@seg_name_html[tracking-1]}#{@md.fnl[:mid]}#{Sfx[:html]}#{@md.fnl[:post]}" + output_seg_file=File.new(segfilename,'w') if @@seg_name_html[tracking-1] + if dob.is=='heading' \ + or @@seg_name_html[tracking-1] !~/endnotes|book_index|metadata/ + Seg_output.new(@md,output_seg_file,@@seg,@minitoc).output + elsif dob.is=='heading_insert' + if @@seg_name_html[tracking-1]=='endnotes' + Seg_output.new(@md,output_seg_file,@@seg,@minitoc,'endnotes').output + elsif @@seg_name_html[tracking-1]=='book_index' + Seg_output.new(@md,output_seg_file,@@seg,@minitoc,'idx').output + @@seg[:idx]=[] + elsif @@seg_name_html[tracking-1]=='metadata' + Seg_output.new(@md,output_seg_file,@@seg,@minitoc,'metadata').output + else puts "#{__FILE__}::#{__LINE__}" + end + else puts "#{__FILE__}::#{__LINE__}" + end + Seg.new.reinitialise + heading_art(dob) + head(dob) + #keep use for last segment, eg if metadata is last segment + #if @@seg_name_html[tracking] =~/metadata/ # this is for metadata + # segfilename="#{@md.dir_out}/#{@md.fnl[:pre]}#{@@seg_name_html[tracking]}#{@md.fnl[:mid]}#{Sfx[:html]}#{@md.fnl[:post]}" + # output_seg_file=File.new(segfilename,'w') + # Seg_output.new(@md,output_seg_file,@@seg,@minitoc,'metadata').output + # Seg.new.reinitialise + #end + end + if tracking==0 + heading_art(dob) + head(dob) + end + end + tracking=tracking+1 + end + @@get_hash_to=dob.name if (dob.is=='heading' or dob.is=='heading_insert') and dob.ln==4 and dob.name + @@get_hash_fn=dob.name if (dob.is=='heading' or dob.is=='heading_insert') and dob.ln==4 and dob.name + if dob.obj.class==String + markup(dob) + elsif dob.obj.class==Array + dob.obj.each do |pg| + markup(pg) + end + end + if testforartnum[tracking-1] =~/endnote/ + if printed_endnote_seg=='n' + printed_endnote_seg='y' + end + end + end + end + data + end + def heading_art(dob) + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln.to_s =~/^[1-6]/ + if @@tracker < @@seg_total-1; @@seg[:dot_nav]=format_head_seg.dot_control_pre_next + else @@seg[:dot_nav]=format_head_seg.dot_control_pre + end + end + ads=SiSU_HTML_promo::Ad.new(@md) + @@seg[:title]=format_head_seg.head << ads.div.major + end + def head(dob) + clean=/|<:.*?>/ + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + if @@tracker < @@seg_total-1 + if @@tracker==0; @@segtocband=format_head_seg.toc_next2 #if format_head_seg.toc_next2 + else @@segtocband=format_head_seg.toc_pre_next2 #if format_head_seg.toc_pre_next2 + end + else @@segtocband=format_head_seg.toc_pre2 #if format_head_seg.toc_pre2 + end + @p_num ||= '' + if @@is1==1 + @author=%{#{@md.author}\n} if @md.author.to_s =~/\S/ + @@seg[:tocband_banner] << format_head_seg.navigation_band(@@segtocband,@@seg[:dot_nav]) + conditional_div_close=if @@get_hash_fn =~/metadata/ #watch + '' + else '' + end + @@seg[:tocband_bannerless] << conditional_div_close << format_head_seg.navigation_band_bottom(@@segtocband,@@seg[:dot_nav]) + @@seg[:headings] << format_head_seg.seg_head_escript if SiSU_HTML_Format::Head_seg.method_defined? :seg_head_escript #debug PHP move up in text #bug + @@seg[:headings] << format_head_seg.title_banner(@md.title.main,@md.title.sub,@author).gsub(clean,'') + ocn=if @@heading1[/.+?#{Mx[:id_o]}~(\d+);(?:[oh]|[0-6]:)\d+;\w\d+#{Mx[:id_c]}#{Mx[:id_o]}#{@dp}:#{@dp}#{Mx[:id_c]}$/]; $1 #fix + else '' + end + @p_num=SiSU_HTML_Format::Paragraph_number.new(@md,ocn) + txt_obj={:txt =>@@heading1,:ocn_display =>@p_num.ocn_display} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @@seg[:headings] << format_seg.title_heading1.gsub(clean,'') + @@heading1.gsub!(/  [\d*+]+<\/sup> <\/a>/,'') + end + if @@is2==1 + heading2=@@heading2 + ocn=if heading2[/.+?#{Mx[:id_o]}~(\d+);(?:[oh]|[0-6]:)\d+;\w\d+#{Mx[:id_c]}#{Mx[:id_o]}#{@dp}:#{@dp}#{Mx[:id_c]}$/]; $1 #fix + else '' + end + @p_num=SiSU_HTML_Format::Paragraph_number.new(@md,ocn) + txt_obj={:txt =>heading2,:ocn_display =>@p_num.ocn_display} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @@seg[:headings] << format_seg.title_heading2.gsub(clean,'') + @@heading2.gsub!(/  [\d*+]+<\/sup> <\/a>/,'') + end + if @@is3==1 + heading3=@@heading3 + ocn=if heading3[/.+?#{Mx[:id_o]}~(\d+);(?:[oh]|[0-6]:)\d+;\w\d+#{Mx[:id_c]}#{Mx[:id_o]}#{@dp}:#{@dp}#{Mx[:id_c]}$/]; $1 #fix + else '' + end + @p_num=SiSU_HTML_Format::Paragraph_number.new(@md,ocn) + txt_obj={:txt =>heading3,:ocn_display =>@p_num.ocn_display} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @@seg[:headings] << format_seg.title_heading3.gsub(clean,'') + @@heading3.gsub!(/  [\d*+]+<\/sup> <\/a>/,'') + end + if @@is4==1 + heading4=@@heading4 + ocn=if heading4[/.+?#{Mx[:id_o]}~(\d+);(?:[oh]|[0-6]:)\d+;\w\d+#{Mx[:id_c]}#{Mx[:id_o]}#{@dp}:#{@dp}#{Mx[:id_c]}$/]; $1 #fix + else '' + end + @p_num=SiSU_HTML_Format::Paragraph_number.new(@md,ocn) + txt_obj={:txt =>heading4,:ocn_display =>@p_num.ocn_display} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + @@seg[:headings] << format_seg.title_heading4.gsub(clean,'') + end + @@tracker=@@tracker+1 + end + def markup(dob) + @debug=[] + dob.obj.gsub!(/(?:\s*#{Mx[:br_page]}\s*|\s*#{Mx[:br_page_new]}\s*)+/m,'') + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + if dob.is !~/meta/ + if dob.is =~/(?:heading|para)/ #extend as necessary FIX + @p_num=SiSU_HTML_Format::Paragraph_number.new(@md,dob.ocn) + end + sto=SiSU_HTML_Format::Format_text_object.new(@md,dob) + dob_html=if dob.is =~/heading|para/ + dob_html=if (dob.is=='heading' \ + or dob.is=='heading_insert') + x=if dob.ln==4 + sto.seg_heading4 + elsif dob.ln==5 + sto.seg_heading5 + elsif dob.ln==6 + sto.seg_heading6 + end + elsif dob.is=='para' + if dob.indent \ + and dob.indent =~/[1-9]/ + if dob.bullet_ + sto.format('li',"i#{dob.indent}") + else sto.format('p',"i#{dob.indent}") + end + else + if dob.bullet_ + sto.format('li','bullet') + else sto.para + end + end + end + elsif dob.is=='group' + sto.group + elsif dob.is=='alt' + sto.alt + elsif dob.is='verse' + sto.verse + elsif dob.is=='code' + sto.code + elsif dob.is=='table' + sto.table + end + if @md.flag_separate_endnotes + dob.obj.gsub!(/"\s+href="#_(\d+)">/,%{" href=\"endnotes#{Sfx[:html]}#_\\1">}) #endnote- twice #removed file type + end + if dob.obj !~/#{@vz.margin_txt_w1}|#{@vz.margin_txt_w2}/ + if dob.is =~/heading|para/ and (not dob.ocn or dob.ocn.to_s.empty?) + format_seg=SiSU_HTML_Format::Format_seg.new(@md,dob) + end + dob.obj.gsub!(/\s*(-\{{2}~\d+|<:e[:_]\d+>).*/,'') #potentially dagerous - removes all paragraphs with #?? workpoint + if dob.obj =~/ / #endnote- note- + format_seg=SiSU_HTML_Format::Format_seg.new(@md,dob) + dob=format_seg.no_paranum + end + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==4 + @@seg[:main] << %{\n
\n} + @@seg[:main] << dob_html + @@seg[:main] << @@seg_subtoc[@@get_hash_fn] #% insertion of sub-toc + else + @@seg[:main] << dob_html #unless @@flag_alt==true + end + end + end + def tail + format_head_seg=SiSU_HTML_Format::Head_seg.new(@md) + if @md.flag_auto_endnotes and @@seg_endnotes[@@get_hash_fn] + @@seg[:tail] << %{\n
\n
\n} + if @@seg_endnotes[@@get_hash_fn].flatten.length > 0 + @@seg[:tail] << format_head_seg.endnote_mark + @@seg[:tail] << @@seg_endnotes[@@get_hash_fn].flatten #endnotes deposited at end of individual segments ||@|EXTRACTION OF ENDNOTES| + end + @@seg[:tail] << '
' + @@seg[:tail] << '
' #this div closes div class content + end + ads=SiSU_HTML_promo::Ad.new(@md) + @@seg[:credits] << format_head_seg.credit << ads.div.close << ads.display << format_head_seg.html_close + end + def reinitialise + @@seg[:title],@@seg[:dot_nav],@@seg[:tocband_banner],@@seg[:tocband_bannerless],@@seg[:headings],@@seg[:main],@@seg[:tail],@@seg[:credits]=Array.new(8){[]} + @@segtocband=nil + end + def cleanup + reinitialise + @@seg_total,@@tracker=0,0 + @@seg_endnotes,@@seg_subtoc={},{} + @@seg_endnotes_array,@@seg_subtoc_array=[],[] + @@seg[:endnote_all]=[] + end + def get_subtoc_endnotes(data) #get endnotes & sub-table of contents subtoc + data.each do |dob| + dob.obj.gsub!(/
(.+?)<\/a>/mi,'\1') + if @md.flag_auto_endnotes + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln.to_s =~/^[1234]/ \ + and not @@fn.to_s.empty? + @@seg_endnotes[@@fn]=[] + @@seg_endnotes[@@fn] << @@seg_endnotes_array + @@seg_endnotes_array=[] if dob.ln==4 + @@fns_previous=@md.fns if dob.ln==4 and dob.name =~/^meta/ + end + if (dob.is=='heading' or dob.is=='heading_insert') \ + and dob.ln==4 #% EXTRACTION OF SUB-TOCs & SEGMENT NAME, after EXTRACTION OF ENDNOTES & SUB-TOCs + @@seg_subtoc[@@fn]=@@seg_subtoc_array + @@seg_subtoc_array=[] + if dob.name \ + and dob.obj + @@fn=dob.name + else + if dob.name =~/\S+/ + @@fn=dob.name + else @@fn='' + end + end + end + end + if dob.is=='heading' \ + and dob.ln.to_s =~/^[56]/ + case dob.ln + when 5 + txt_obj={:txt =>dob.obj.strip,:ocn =>dob.ocn} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + subtoc=format_seg.subtoc_lev5 #keep and make available, this is the subtoc + when 6 + txt_obj={:txt =>dob.obj.strip,:ocn =>dob.ocn} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + subtoc=format_seg.subtoc_lev6 #keep and make available, this is the subtoc + end + @@seg_subtoc_array << subtoc + end + if @md.flag_auto_endnotes + if dob.obj =~/(?:#{Mx[:en_a_o]}|#{Mx[:en_b_o]})[\d*+]+ /) + try.each do |e| + txt_obj={:txt =>e} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + note_match=if e =~/#{Mx[:pa_o]}i[1-9]#{Mx[:pa_c]}/ + format_seg.endnote_body_indent + else format_seg.endnote_body + end + @@seg_endnotes_array << note_match + end + try.join('
') + #% creation of separate end segment/page of all endnotes referenced back to reference segment + m=/(?:#{Mx[:en_a_o]}[\d*+]+|#{Mx[:en_b_o]}[*+]\d+)\s+(.+?href=")(#-[\d*+]+".+)(?:#{Mx[:en_a_c]}|#{Mx[:en_b_c]})/mi + endnote_part_a=note_match_seg[m,1] + endnote_part_b=note_match_seg[m,2] + txt_obj={:endnote_part_a =>endnote_part_a,:endnote_part_b =>endnote_part_b} + format_seg=SiSU_HTML_Format::Format_seg.new(@md,txt_obj) + note_match_all_seg=format_seg.endnote_seg_body(@@fn) #BUG WATCH 200408 + @@seg[:endnote_all] << note_match_all_seg + end + dob.obj.gsub!(/(?:#{Mx[:en_a_o]}.+?#{Mx[:en_a_c]}|#{Mx[:en_b_o]}.+?#{Mx[:en_b_c]})\s*/m,' ') + end + end + end + end + end +end +__END__ -- cgit v1.2.3