# encoding: utf-8
=begin
* Name: SiSU
* Description: a framework for document structuring, publishing and search
* Author: Ralph Amissah
* Copyright: (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006,
2007, 2008, 2009, 2010, 2011, 2012 Ralph Amissah, All Rights Reserved.
* License: GPL 3 or later:
SiSU, a framework for document structuring, publishing and search
Copyright (C) Ralph Amissah
This program is free software: you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the Free
Software Foundation, either version 3 of the License, or (at your option)
any later version.
This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
more details.
You should have received a copy of the GNU General Public License along with
this program. If not, see .
If you have Internet connection, the latest version of the GPL should be
available at these locations:
* SiSU uses:
* Standard SiSU markup syntax,
* Standard SiSU meta-markup syntax, and the
* Standard SiSU object citation numbering and system
* Hompages:
* Download:
* Ralph Amissah
** Description: epub generation, epub pre-processing
=end
require_relative 'param'
module SiSU_EPUB_Tune
require_relative 'sysenv' # sysenv.rb
include SiSU_Env; include SiSU_Screen
require_relative 'epub_format' # epub_format.rb #watch
@@line_mode=''
@@endnote_array=[]
@@endnote_call_counter=1
@@table_align='
 \; |
'
@@table_align_close=' |
|
'
@@counter,@@column,@columns=0,0,0
class Output
def initialize(data,md)
@data,@md=data,md
@file=SiSU_Env::FileOp.new(@md)
@cX=SiSU_Screen::Ansi.new(@md.opt.cmd).cX
end
def hard_output
@filename_tune=@file.write_file_processing.html_tune
data=[]
@data.each {|x| x.obj.strip; data << x if not x.obj.empty?} #1.9 array?
data.each do |dob|
@filename_tune.puts dob, "\n" #check
end
end
def marshal
File.open(@file.marshal.html_tune,'w') {|f| Marshal.dump(@data.to_a,f)}
end
end
class CleanXHTML
def initialize(html='')
@html=html
end
def clean
html=@html
str=if html.is_a?(String)
html
else html.obj
end
str=str.gsub(/#{Mx[:gl_o]}(#[0-9]{3})#{Mx[:gl_c]}/u,'&\1;').
gsub(/#{Mx[:gl_o]}#([a-z]{2,4})#{Mx[:gl_c]}/u,'&\1;').
gsub(/\*/u,'*'). # *
gsub(/\+/u,'+'). # +
gsub(/¢/u,'¢'). # ¢
gsub(/£/u,'£'). # £
gsub(/¥/u,'¥'). # ¥
gsub(/§/u,'§'). # §
gsub(/©/u,'©'). # ©
gsub(/ª/u,'ª'). # ª
gsub(/«/u,'«'). # «
gsub(/®/u,'®'). # ®
gsub(/°/u,'°'). # °
gsub(/±/u,'±'). # ±
gsub(/²/u,'²'). # ²
gsub(/³/u,'³'). # ³
gsub(/µ/u,'µ'). # µ
gsub(/¶/u,'¶'). # ¶
gsub(/¹/u,'¹'). # ¹
gsub(/º/u,'º'). # º
gsub(/»/u,'»'). # »
gsub(/¼/u,'¼'). # ¼
gsub(/½/u,'½'). # ½
gsub(/¾/u,'¾'). # ¾
gsub(/×/u,'×'). # ×
gsub(/÷/u,'÷'). # ÷
gsub(/¿/u,'¿'). # ¿
gsub(/À/u,'À'). # À
gsub(/Á/u,'Á'). # Á
gsub(/Â/u,'Â'). # Â
gsub(/Ã/u,'Ã'). # Ã
gsub(/Ä/u,'Ä'). # Ä
gsub(/Å/u,'Å'). # Å
gsub(/Æ/u,'Æ'). # Æ
gsub(/Ç/u,'Ç'). # Ç
gsub(/È/u,'È'). # È
gsub(/É/u,'É'). # É
gsub(/Ê/u,'Ê'). # Ê
gsub(/Ë/u,'Ë'). # Ë
gsub(/Ì/u,'Ì'). # Ì
gsub(/Í/u,'Í'). # Í
gsub(/Î/u,'Î'). # Î
gsub(/Ï/u,'Ï'). # Ï
gsub(/Ð/u,'Ð'). # Ð
gsub(/Ñ/u,'Ñ'). # Ñ
gsub(/Ò/u,'Ò'). # Ò
gsub(/Ó/u,'Ó'). # Ó
gsub(/Ô/u,'Ô'). # Ô
gsub(/Õ/u,'Õ'). # Õ
gsub(/Ö/u,'Ö'). # Ö
gsub(/Ø/u,'Ø'). # Ø
gsub(/Ù/u,'Ù'). # Ù
gsub(/Ú/u,'Ú'). # Ú
gsub(/Û/u,'Û'). # Û
gsub(/Ü/u,'Ü'). # Ü
gsub(/Ý/u,'Ý'). # Ý
gsub(/Þ/u,'Þ'). # Þ
gsub(/ß/u,'ß'). # ß
gsub(/à/u,'à'). # à
gsub(/á/u,'á'). # á
gsub(/â/u,'â'). # â
gsub(/ã/u,'ã'). # ã
gsub(/ä/u,'ä'). # ä
gsub(/å/u,'å'). # å
gsub(/æ/u,'æ'). # æ
gsub(/ç/u,'ç'). # ç
gsub(/è/u,'è'). # è
gsub(/é/u,'é'). # é
gsub(/ê/u,'ê'). # ê
gsub(/ë/u,'ë'). # ë
gsub(/ì/u,'ì'). # ì
gsub(/í/u,'í'). # í
gsub(/î/u,'î'). # î
gsub(/ï/u,'ï'). # ï
gsub(/ð/u,'ð'). # ð
gsub(/ñ/u,'ñ'). # ñ
gsub(/ò/u,'ò'). # ò
gsub(/ó/u,'ó'). # ó
gsub(/ô/u,'ô'). # ô
gsub(/õ/u,'õ'). # õ
gsub(/ö/u,'ö'). # ö
gsub(/ø/u,'ø'). # ø
gsub(/ù/u,'ù'). # ú
gsub(/ú/u,'ú'). # û
gsub(/û/u,'û'). # ü
gsub(/ü/u,'ü'). # ý
gsub(/þ/u,'þ'). # þ
gsub(/ÿ/u,'ÿ'). # ÿ
gsub(/ý/u,'ý').
gsub(/
/u,'
').
gsub(/#{Mx[:nbsp]}/u,' ')
end
end
class Tune
def initialize(data,md)
@data,@md=data,md
@vz=SiSU_Env::GetInit.instance.skin
@env=SiSU_Env::InfoEnv.new(@md.fns)
@sys=SiSU_Env::SystemCall.new
@env=SiSU_Env::InfoEnv.new(@md.fns)
@brace_url=SiSU_Viz::Skin.new.url_decoration
end
def songsheet
begin
@cX=SiSU_Screen::Ansi.new(@md.opt.cmd).cX
SiSU_Screen::Ansi.new(@md.opt.cmd,'Tune').txt_grey if @md.opt.cmd =~/[MVv]/
data=SiSU_EPUB_Tune::Tune.new(@data,@md).amp_html
data=SiSU_EPUB_Tune::Tune.new(data,@md).endnotes_html
data=SiSU_EPUB_Tune::Tune.new(data,@md).url_markup
data=SiSU_EPUB_Tune::Tune.new(data,@md).markup
if @md.opt.cmd =~/M/ #Hard Output Tune Optional on/off here
data=SiSU_EPUB_Tune::Output.new(data,@md).hard_output
SiSU_EPUB_Tune::Output.new(data,@md).marshal
end
tuned=SiSU_EPUB_Tune::Tune.new(@data,@md).output
rescue
SiSU_Errors::InfoError.new($!,$@,@md.opt.cmd,@md.fns).error do
__LINE__.to_s + ':' + __FILE__
end
ensure
end
end
def markup
@tuned_file=[]
@data.each do |dob|
dob.obj=dob.obj.gsub(/#{Mx[:mk_o]}#([a-zA-Z]+)#{Mx[:mk_c]}/,'&\1;').
gsub(/#{Mx[:mk_o]}(#[0-9]+)#{Mx[:mk_c]}/,'&\1;')
dob.obj=dob.obj.gsub(/#{Mx[:br_line]}|#{Mx[:br_nl]}/,'
') unless dob.is==:table
dob.obj=dob.obj.gsub(/#{Mx[:fa_bold_o]}(.+?)#{Mx[:fa_bold_c]}/,'\1').
gsub(/#{Mx[:fa_italics_o]}(.+?)#{Mx[:fa_italics_c]}/,'\1').
gsub(/#{Mx[:fa_underscore_o]}(.+?)#{Mx[:fa_underscore_c]}/,'\1').
gsub(/#{Mx[:fa_superscript_o]}(.+?)#{Mx[:fa_superscript_c]}/,'\1').
gsub(/#{Mx[:fa_subscript_o]}(.+?)#{Mx[:fa_subscript_c]}/,'\1').
gsub(/#{Mx[:fa_insert_o]}(.+?)#{Mx[:fa_insert_c]}/,'\1').
gsub(/#{Mx[:fa_cite_o]}(.+?)#{Mx[:fa_cite_c]}/,'\1').
gsub(/#{Mx[:fa_strike_o]}(.+?)#{Mx[:fa_strike_c]}/,'\1').
gsub(/#{Mx[:fa_monospace_o]}(.+?)#{Mx[:fa_monospace_c]}/,'\1'). # tt, kbd
gsub(/#{Mx[:mk_o]}:name#(\S+?)#{Mx[:mk_c]}/,'').
gsub(/#{Mx[:gl_bullet]}/m,'● ').
gsub(/#{Mx[:nbsp]}/,' ').
gsub(/<(p|br)>/,'<\1 />')
dob.obj=SiSU_EPUB_Tune::CleanXHTML.new(dob.obj).clean
@tuned_file << dob
end
end
def urls(data)
@words=[]
map_nametags=SiSU_Particulars::CombinedSingleton.instance.get_map_nametags(@md).nametags_map #p map_nametags
data.each do |word|
@words << if word=~/#{Mx[:lnk_o]}(.+?)#{Mx[:lnk_c]}(?:#{Mx[:url_o]}\S+?#{Mx[:url_c]}|#{Mx[:rel_o]}\S+?#{Mx[:rel_c]}|image)/
http_=true
if word =~/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}#{Mx[:url_o]}\S+?#{Mx[:url_c]}/
m,u=/#{Mx[:lnk_o]}(.+?)#{Mx[:lnk_c]}#{Mx[:url_o]}(\S+?)#{Mx[:url_c]}/.match(word).captures
elsif word =~/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}#{Mx[:rel_o]}\S+?#{Mx[:rel_c]}/
http_=false
m,u=/#{Mx[:lnk_o]}(.+?)#{Mx[:lnk_c]}#{Mx[:rel_o]}(\S+?)#{Mx[:rel_c]}/.match(word).captures
elsif word =~/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}image/
m,u=/#{Mx[:lnk_o]}(.+?)#{Mx[:lnk_c]}(image)/.match(word).captures
end
case m
when /\.png|\.jpg|\.gif|c=|\s\d+x\d+/
w,h=/\s(\d+)x(\d+)/.match(m).captures if m =~/\s\d+x\d+/
w=%{width="#{w}"} if w
h=%{height="#{h}"} if h
c=m[/"(.+?)"/m,1]
caption=%{
#{c}
} if c
png=m.scan(/\S+/)[0]
image_path=@md.file.output_path.epub.rel_image #image_path=@env.url.images_epub
ins=if u \
and u.strip !~/^image$/
%{#{caption}}
else %{#{caption}}
end
word=word.gsub(/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}(?:#{Mx[:url_o]}\S+?#{Mx[:url_c]}|image)/,ins)
else
link=m[/(.+)/m]
png=m.scan(/\S+/)[0].strip
link=link.strip
u=u.sub(/^#*/,'') #make neater
if map_nametags[u] \
and map_nametags[u][:segname]
u=unless http_
u=if u=~/^\d+$/
u.gsub(/^(\d+)$/,"#{map_nametags[u][:segname]}#{Sfx[:xhtml]}#o\\1") if u !~/\//
else
u.gsub(/(\S+)/,"#{map_nametags[u][:segname]}#{Sfx[:xhtml]}#\\1") if u !~/\//
end
else u
end
elsif u =~/^:/
u=u.gsub(/^:/,"#{@env.url.root}/")
elsif u =~/^\.\.\//
u=u.gsub(/^\.\.\//,"#{@env.url.root}/")
elsif u =~/https?:\/\//
else p "NOT FOUND name_tags: #{u}"
end
ins=%{#{link}}
word=word.gsub(/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}#{Mx[:url_o]}\S+?#{Mx[:url_c]}/,ins).
gsub(/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}#{Mx[:rel_o]}\S+?#{Mx[:rel_c]}/,ins)
end
word
else word
end
word
end
@words=@words.join(' ')
end
def url_markup
data=@data
@tuned_file=[]
data.each do |dob|
unless dob.is==:code
if dob.obj =~/<::\s+/ #watch
dob.obj=dob.obj.gsub(/<::\s+(\S+?)\s+!>/,
%{})
end
if dob.obj =~/<:image\s+/
dob.obj=dob.obj.gsub(/<:image\s+(http\S+)\s+(\S+)\s+(\S+)\s+(\S+)\s+>/,
%{}).
gsub(/<:image\s+(http\S+)\s+(\S+)\s+>/,
%{}).
gsub(/<:image\s+(\S+)\s+(\S+)\s+(\S+)\s+>/,
%{}).
gsub(/<:image\s+(\S+)\s+>/,
%{})
end
if dob.obj =~/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}(?:#{Mx[:url_o]}\S+?#{Mx[:url_c]}|#{Mx[:rel_o]}\S+?#{Mx[:rel_c]}|image)/
@word_mode=dob.obj.scan(/#{Mx[:lnk_o]}.+?#{Mx[:lnk_c]}(?:#{Mx[:url_o]}\S+?#{Mx[:url_c]}|#{Mx[:rel_o]}\S+?#{Mx[:rel_c]}|image)[()\[\]]*[,.;:!?'"]{0,2}|(?:#{Mx[:gl_o]}\S+?#{Mx[:gl_c]})+|[^#{Mx[:lnk_o]}#{Mx[:lnk_c]}]+/mu)
words=urls(@word_mode)
dob.obj=dob.obj.gsub(/.+/m,words)
end
dob.obj=dob.obj.gsub(/\\copyright/i,%{©})
dob.obj=if (dob.obj !~/\<:ad\s+\.\.\//)
dob.obj.gsub(/\<:ad\s+(\S+)?\s+(\S+\.png)\s+(.+)?\;\s+(.+)?\;\s*!\>/,
%{\n\n})
else
dob.obj.gsub(/\<:ad\s+(\S+)?\s+(\S+\.png)\s+(.+)?\;\s+(.+)?\;\s*\>/,
%{\n\n})
end
dob.obj=dob.obj.gsub(/!pick/,%{}).
gsub(/!new/,%{ }).
gsub(/<:h(.{1,7}?)>/,'\1').
gsub(/<:to(\d{1,7}?)>/,'to { \1 } ').
gsub(/#{Mx[:url_o]}_(\S+?)#{Mx[:url_c]}/,'\1'). #http ftp matches escaped, no decoration
gsub(/#{Mx[:url_o]}([a-zA-Z0-9._-]+\@\S+?\.[a-zA-Z0-9._-]+)#{Mx[:url_c]}/,%{#{@brace_url.xml_open}\\1#{@brace_url.xml_close}}).
gsub(/#{Mx[:url_o]}(\S+?)#{Mx[:url_c]}/,%{#{@brace_url.xml_open}\\1#{@brace_url.xml_close}}) #http ftp matches with decoration
if dob.obj =~/..\/\S+/ \
and dob.obj !~/(\"..\/\S+?\"|>\s*..\/\S+<)/
dob.obj=dob.obj.gsub(/(\.\.\/\S+)/,'\1')
end
dob.obj=dob.obj.gsub(//m,'>')
end
@tuned_file << dob
end
end
def amp_html
data,data_new=@data,[]
data.each do |dob|
dob.obj=dob.obj.gsub(/&/u,'&')
data_new << dob
end
data_new
end
def endnotes_html
data=@data
@tuned_file=[]
a,s='_a','_s'
ast,pls='*','+'
data.each do |dob|
unless dob.is ==:code
dob.obj=dob.obj.gsub(/(#{Mx[:en_a_o]}|#{Mx[:en_b_o]})(\d+)\s+(.+?)(#{Mx[:en_a_c]}|#{Mx[:en_b_c]})/,
%{#{Mx[:nbsp]}#{Mx[:nbsp]}\\2#{Mx[:nbsp]} } + #note- endnote-
%{\\1\\2 #{Mx[:nbsp]}\\2. \\3 \\4}). #endnote- note- (careful may have switched)
gsub(/(#{Mx[:en_b_o]})[*](\d+)\s+(.+?)(#{Mx[:en_b_c]})/,
%{#{Mx[:nbsp]}#{Mx[:nbsp]}#{ast}\\2#{Mx[:nbsp]} } + #note- endnote-
%{\\1#{ast}\\2 #{Mx[:nbsp]}#{ast}\\2. \\3 \\4}). #endnote- note- (careful may have switched)
gsub(/(#{Mx[:en_b_o]})[+](\d+)\s+(.+?)(#{Mx[:en_b_c]})/,
%{#{Mx[:nbsp]}#{Mx[:nbsp]}#{pls}\\2#{Mx[:nbsp]} } + #note- endnote-
%{\\1#{pls}\\2 #{Mx[:nbsp]}#{pls}\\2. \\3 \\4}) #endnote- note- (careful may have switched) # double-check there may here be a bug
if dob.obj =~/#{Mx[:en_a_o]}([*+]+)\s+.+?#{Mx[:en_a_c]}/
m=$1.length.to_i
dob.obj=dob.obj.gsub(/(#{Mx[:en_a_o]})[*]+\s+(.+?)(#{Mx[:en_a_c]})/,
%{#{Mx[:nbsp]}#{Mx[:nbsp]}#{ast*m}#{Mx[:nbsp]} } + #note- endnote-
%{\\1#{ast*m} #{Mx[:nbsp]}#{ast*m} \\2 \\3}). #endnote- note- (careful may have switched)
gsub(/(#{Mx[:en_a_o]})([+]+)\s+(.+?)(#{Mx[:en_a_c]})/,
%{#{Mx[:nbsp]}#{Mx[:nbsp]}#{pls*m}#{Mx[:nbsp]} } + #note- endnote-
%{\\1#{pls*m} #{Mx[:nbsp]}#{pls*m} \\2 \\3}) #endnote- note- (careful may have switched)
end
end
@tuned_file << dob
end
end
def output
data=@data
@tuned_file=[]
data.each do |dob|
dob.obj=dob.obj.strip.chomp
@tuned_file << dob
end
@tuned_file << "\n" if (@md.fns =~/\.sst0/) #remove
@tuned_file
end
end
end
__END__