From 0e6fc15ada3c5d9a86b227163f35a54993b32529 Mon Sep 17 00:00:00 2001 From: Ralph Amissah Date: Tue, 2 Dec 2008 23:54:23 -0500 Subject: sisu harvest, introduce module along with header syntax addition & modification * sisu markup, additional header and new format rule: * @creator: / @author: header field, introduced author name format rules for more usable metadata harvesting: surname comma other names, additional authors separated by semi-colon * param added meta-tag, @topic_register: formatting topic levels are separated from sub-levels by a colon, a semi-colon separates main topics if there are multiple topics at lowest sub-level, a pipe can be used to create multiple headings * harvest module, harvests metadata from document set currently extracts: (i) authors and their writings from document set; (ii) topics and associated writings from document set (topics use topic_register header). harvest (when run against documents common to a directory of a site) extracts metadata and organises the documents on a site by author and topic information provided (there is a new "topic_register" header, with formatting rules similar to those of the book index), results are placed in [output_path]/sisu_site_metadata. sisu --harvest *.sst * by author (see change in param @creator: / @author: header field) * by topic / subject index (see addition in param of @topic_register: header field) initially there should be example samples here: http://www.jus.uio.no/sisu/sisu_site_metadata/harvest_authors.html http://www.jus.uio.no/sisu/sisu_site_metadata/harvest_topics.html together with updated markup source files The authors and their writings list will be made to take on a more bibliographical form, with the use of additional fields as required. 
(concept example, suitable for medium sized sites [to remove size constraint: implement SQL equivalent]) make feature more robust * css, for harvest output added * remote placement of sisu_site_metadata (output produced by metadata harvest) * sisu markup, update document samples accordingly * tidy copyright marks in program headers, remove repetition of dates [version bump because formatting rule introduced to author / creator header - where new site metadata harvest feature is used, (at present changes should not be noticed except when using metadata harvest)] --- lib/sisu/v0/remote.rb | 84 ++++++++++++++++++++++++++++++++++++++++----------- 1 file changed, 67 insertions(+), 17 deletions(-) (limited to 'lib/sisu/v0/remote.rb') diff --git a/lib/sisu/v0/remote.rb b/lib/sisu/v0/remote.rb index 4cfa9347..ea50f3bb 100644 --- a/lib/sisu/v0/remote.rb +++ b/lib/sisu/v0/remote.rb @@ -14,8 +14,7 @@ SiSU, a framework for document structuring, publishing and search - Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, - 2007, 2008 Ralph Amissah + Copyright (C) Ralph Amissah This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free @@ -71,26 +70,11 @@ module SiSU_Remote end @remote=SiSU_Env::Info_remote.new(@opt) end - def scp - tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->',@put) - tell.dark_grey_title_hi unless @opt.cmd =~/q/ - @remote.scp - end def rsync tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->',@put) tell.dark_grey_title_hi unless @opt.cmd =~/q/ @remote.rsync end - def scp_base - tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement of base site ->','excluding images') - tell.dark_grey_title_hi unless @opt.cmd =~/q/ - @remote.scp_base - end - def scp_base_all - tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','complete') - tell.dark_grey_title_hi unless @opt.cmd =~/q/ - @remote.scp_base_all - end def rsync_base 
tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','rsync') tell.dark_grey_title_hi unless @opt.cmd =~/q/ @@ -106,6 +90,72 @@ module SiSU_Remote tell.dark_grey_title_hi unless @opt.cmd =~/q/ @remote.rsync_sitemaps end + def rsync_harvest + tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement metadata harvest ->','rsync_harvest') + tell.dark_grey_title_hi unless @opt.cmd =~/q/ + @remote.rsync_harvest + end + def scp + tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->',@put) + tell.dark_grey_title_hi unless @opt.cmd =~/q/ + @remote.scp + end + def scp_base + tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement of base site ->','excluding images') + tell.dark_grey_title_hi unless @opt.cmd =~/q/ + @remote.scp_base + end + def scp_base_all + tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','complete') + tell.dark_grey_title_hi unless @opt.cmd =~/q/ + @remote.scp_base_all + end + #def rsync + # def do #rsync + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->',@put) + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.rsync + # end + # def base + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','rsync') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.rsync_base + # end + # def base_sync + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','rsync and sync') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.rsync_base_sync + # end + # def sitemaps + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement sitemaps ->','rsync') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.rsync_sitemaps + # end + # def harvest + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement metadata harvest ->','rsync') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.rsync_harvest + # end + # self + #end + #def scp + # def do #scp + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->',@put) + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.scp + # end + # def 
scp_base + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement of base site ->','excluding images') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.scp_base + # end + # def scp_base_all + # tell=SiSU_Screen::Ansi.new(@opt.cmd,'Remote placement ->','complete') + # tell.dark_grey_title_hi unless @opt.cmd =~/q/ + # @remote.scp_base_all + # end + # self + #end end class Get def initialize(opt,get_s) -- cgit v1.2.3