=begin * Name: SiSU information Structuring Universe - Structured information, Serialized Units * Author: Ralph Amissah * http://www.jus.uio.no/sisu * http://www.jus.uio.no/sisu/SiSU/download.html * Description: document digests (md5|sha256) and structure processing * Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007 Ralph Amissah * License: GPL 2 or later Summary of GPL 2 This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA If you have Internet connection, the latest version of the GPL should be available at these locations: http://www.fsf.org/licenses/gpl.html http://www.gnu.org/copyleft/gpl.html http://www.jus.uio.no/sisu/gpl2.fsf SiSU was first released to the public on January 4th 2005 SiSU uses: * Standard SiSU markup syntax, * Standard SiSU meta-markup syntax, and the * Standard SiSU object citation numbering and system © Ralph Amissah 1997, current 2007. All Rights Reserved. * Notes: tidy -ascii index.xml >> index.tidy * Ralph Amissah: ralph@amissah.com ralph.amissah@gmail.com =end module SiSU_Digest_view require "#{SiSU_lib}/dal" require "#{SiSU_lib}/sysenv" require "#{SiSU_lib}/i18n" include SiSU_Env include SiSU_Param include SiSU_Viz pwd=Dir.pwd class Source @@dg=nil def initialize(opt) @opt=opt @fnb=@opt.fnb @@endnotes_para=[] @@dg=nil @dg=@@dg ||=SiSU_Env::Info_env.new.digest.type @env=SiSU_Env::Info_env.new(@opt.fns) end def read begin @md=SiSU_Param::Parameters.new(@opt).get tool=if @opt.cmd =~/[MVv]/; "#{@env.program.text_editor} #{@env.path.output_tell}/#{@md.fnb}/#{@md.fn[:digest]}" else '' end tell=SiSU_Screen::Ansi.new(@opt.cmd,"Document #@dg Digests",tool) tell.green_hi_blue unless @opt.cmd =~/q/ tell=SiSU_Screen::Ansi.new(@opt.cmd,@opt.fns,"#{@env.path.output_tell}/#{@md.fnb}/#{@md.fn[:digest]}") tell.flow if @opt.cmd =~/[MV]/ my_make=SiSU_Env::Create_file.new(@opt.cmd,@opt.fns) @dal_array=SiSU_DAL::Source.new(@opt).get # dal file drawn here SiSU_Digest_view::Source::Scroll.new(@dal_array,@md).songsheet SiSU_Env::Info_skin.new(@md).select rescue; SiSU_Errors::Info_error.new($!,$@,@opt.cmd,@opt.fns).error ensure end end private class Scroll <([0-9a-f]{#@dl}):([0-9a-f]{#@dl})>/ ocn,h1,h2,d_clean,d_all=$1,$2,$3,$4,$5 @ocn=ocn unless ocn.to_i == 0 if para=~/~\{[\d*+]+.+?<[0-9a-f]{#@dl}>\}~/ para_endnotes << para.scan(/~[{\[]([\d*+]+).+?<([0-9a-f]{#@dl})>[}\]]~/) end ima=[] if para =~/\{(\S+\.(png|jpg|gif))\s.+?\}(?:(?:https?|ftp):\/\/\S+|image)/ images=para.scan(/\{(\S+\.(?:png|jpg|gif))\s.+?\}(?:(?:https?|ftp):\/\/\S+|image)/).flatten else image=nil end x=case para when /^0~title/ "\n" + ' '*0 +'@' + ' '*9 when /^0~subtitle/ "\n" + ' '*1 +'@' + ' '*8 when /^1~/ "\n" + ' '*2 +':A ' + ' '*6 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all when /^2~/ "\n" + ' '*3 +':B ' + ' '*5 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all when /^3~/ "\n" + ' '*4 +':C ' + ' '*4 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all when /^4~/ "\n" + ' '*5 +'1' + ' '*4 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all when /^5~/ "\n" + ' '*6 +'2' + ' '*3 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all when /^6~/ "\n" + ' '*7 +'3' + ' '*2 +'- ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all else if para =~/MD5\(\S+?\.sst\)=\s*([0-9a-f]{#@dl})<\/u>/ #watch @n,@s=/MD5\((\S+?\.sst)\)=\s*([0-9a-f]{#@dl})<\/u>/.match(para)[1,2] end x=unless ocn =~ /^0$/ if images and images.length > 0 # then get path of image & produce digest @image_name,@image_dgst,@img=[],[],[] images.each do |i| image_source=if FileTest.file?("#{@env.path.image_source_local_tex}/#{i}") @env.path.image_source_local_tex elsif FileTest.file?("#{@env.path.image_source_remote_tex}/#{i}") @env.path.image_source_remote_tex elsif FileTest.file?("#{@env.path.image_source_tex}/#{i}") @env.path.image_source_tex else tell=SiSU_Screen::Ansi.new(@md.cmd,"ERROR - image:", %{"#{i}" missing}, "search locations: #{@env.path.image_source_local_tex}, #{@env.path.image_source_remote_tex} and #{@env.path.image_source_tex}") tell.error2 unless @md.cmd =~/q/ nil end @img << /\S+\.(png|jpg|gif)/.match(i)[1] not_found_msg='image not found' if image_source para_image = image_source + '/' + i @image_name << i @image_dgst << if @dg =~/^sha(?:2|256)$/; sys.sha256(para_image) else sys.md5(para_image) end else @image_name << ' '*16 + i + ' [image missing]' @image_dgst << '' @image_dgst[1]=not_found_msg + ' '*(32-not_found_msg.length) end end line= "\n" + ' '*9 + ' - ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all + "\n" line_image=[] c=0 @image_name.each do |ok| line_image << %{ #{@img[c]} #{@image_dgst[c][1]} #{@image_name[c]}} c +=1 end line=line + line_image.join("\n") else "\n" + ' '*9 + ' - ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all end else prefix='' metad=[@tr.dc_title,@tr.creator,@tr.translator,@tr.illustrator,@tr.prepared_by,@tr.digitized_by,@tr.description,@tr.subject,@tr.abstract,@tr.publisher,@tr.contributor,@tr.date_created,@tr.date_issued,@tr.date_available,@tr.date_modified,@tr.date_valid,@tr.date,@tr.type,@tr.format,@tr.rights,@tr.identifier,@tr.source,@tr.language,@tr.language_original,@tr.relation,@tr.coverage,@tr.keywords,@tr.comments,@tr.cls_loc,@tr.cls_dewey,@tr.cls_gutenberg,@tr.cls_isbn,@tr.prefix_a,@tr.prefix_b,@tr.sourcefile,@tr.sourcefile_digest,@tr.last_generated,@tr.sisu_version,@tr.ruby_version,@tr.sc_number,@tr.sc_date,'Skin_Digest: ','Generated by: ','Ruby version: '] metad.each do |n| m=rgx_txt(n) if m=~/\S+/ and para=~/^#{m}:/ x,o=0,18 while x < 2; o = o + 2 x=o - n.length end space=' '*x prefix="#{n.downcase}#{space}" break else prefix=' '*9 end end m_dc_title=rgx_txt(@tr.dc_title) m_creator=rgx_txt(@tr.creator) m_sourcefile_digest=rgx_txt(@tr.sourcefile_digest) m_sisu_version=rgx_txt(@tr.sisu_version) m_last_generated=rgx_txt(@tr.last_generated) m_ruby_version=rgx_txt(@tr.ruby_version) case para when /#{m_dc_title}: / @t=/#{m_dc_title}: (.+?)<~\d;(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/.match(para)[1].gsub(/<\/?u>/,'').strip when /#{m_creator}: / @c=/#{m_creator}: (.+?)<~\d;(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/.match(para)[1].gsub(/<\/?u>/,'').strip when /#{m_sourcefile_digest}.+?/ #watch dgst_extra="\n" + ' '*21 +'source' +' '*4 + @md.dgst[1] + ' '*34 + @md.fns when /Skin_Digest: / dgst_extra="\n" + ' '*21 + 'skin' +' '*6 + @md.dgst_skin[1] + ' '*34 + /(skin_\S+?\.rb)/.match(@md.dgst_skin[0])[1] when /#{m_sisu_version}: / @v=/#{m_sisu_version}: (.+?)<~\d;(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/.match(para)[1].gsub(/<\/?u>/,'').strip when /#{m_last_generated}: / @g=/#{m_last_generated}: (.+?)<~\d;(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/.match(para)[1].gsub(/<\/?u>/,'').strip # 'doc last generated' when /#{m_ruby_version}: / @r=/#{m_ruby_version}: (.+?)<~\d;(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/.match(para)[1].gsub(/<\/?u>/,'').strip end dgst_extra ||='' "\n" + prefix +' - ' + ocn + ' '*(10-ocn.length) + d_clean + ' ' + d_all + dgst_extra + "\n" end end para_endnotes[0].each { |e| y << "\n" + ' '*(28-e[0].length) + "[#{e[0].to_s}] #{e[1].to_s}" } if para_endnotes[0] if y; digests(x,y) else digests(x) end end end manifest="#{@env.url.root}/#{@md.fnb}/sisu_manifest.html" a=%{level (if any), ocn: digest clean (no markup/notes), digest all (includes markup & endnotes)\n [endnote number] endnote digest clean\n} description("#@t\n") description("#@c\n") description("#{@md.fns}\n") description("----------------------------------------------\n") description("SiSU Document Content Certificate (Digest/DCC)\n") description("----------------------------------------------\n") description(" #@dg digests\n") description("------------\n") description("Sourcefile digest: #@s\n") description(" source filename: #@n\n") description("available outputs: #{manifest}\n") description(" time generated: #@g\n") description(" SiSU version used: #@v\n") description(" Ruby version used: #@r\n") description("------------\n") description("Document Digest Tree (from dal):\n") description(a) #digests("------------\n") #digests("#@v\n") #digests("#@g\n") #digests("#@r\n") end def dal_structure #there will be a docubook mapping header, fairly complex variations data=@data l=Hash.new(0) dal_structure1("------------\n") dal_structure1("document structure[*]\n") ocn,endnotes=nil,nil data.each do |para| x=case para when /^0~/; l[0] +=1 if para =~/^0~title/; '' #' '*0 +'@ == headers' + "\n" + ' '*0 +'headings:' end when /^1~/; l[1] +=1 ' '*0 +':A' when /^2~/; l[2] +=1 ' '*1 +':B' when /^3~/; l[3] +=1 ' '*2 +':C' when /^4~/; l[4] +=1 ' '*3 +'1' when /^5~/; l[5] +=1 ' '*4 +'2' when /^6~/; l[6] +=1 ' '*5 +'3' else nil end if para =~/<~(\d+);(?:\w|[0-6]:)\d+;\w\d+><[0-9a-f]{#@dl}:[0-9a-f]{#@dl}>/ ocn=$1 unless $1.to_i == 0 end if para =~/~[{\[]([\d*+]+).+?<[0-9a-f]{#@dl}>[}\]]~/ endnotes=$1 unless $1.to_i == 0 end dal_structure1("#{x}\n") if x and not x.empty? end dal_structure1(" [*] heading levels\n") dal_structure2("------------\n") dal_structure2("document structure[*]\n") [0,1,2,3,4,5,6].each do |y| v=case y.to_s when /0/; '@ ' when /1/; ':A' when /2/; ':B' when /3/; ':C' when /4/; '1 ' when /5/; '2 ' when /6/; '3 ' end dal_structure2("#{v} = #{l[y]}\n") if l[y] > 0 end dal_structure2("objects (ocn) = #{ocn}\n") dal_structure2("endnotes = #{endnotes}\n") dal_structure2(" [*] number of headers (@) and of each heading level (:A to :C and 1 to 3)\n") end def supplementary if defined? @md.sc_number and @md.sc_number rcinfo("------------\n") rcinfo("source control information\n") rcinfo(" (the following information while not important for document content certification\n may help the publisher in locating the version referred to)\n") rcinfo(" rcs version number: #{@md.sc_number}\n") if defined? @md.sc_date and @md.sc_date rcinfo(" rcs date: #{@md.sc_date}\n") end if defined? @md.sc_time and @md.sc_time rcinfo(" rcs time: #{@md.sc_time}\n") end end rcinfo("------------\n") rcinfo("Note: the time generated related fields (text and digests) will vary between otherwise identical document outputs\n") end end end end __END__