diff options
| -rw-r--r-- | data/doc/sisu/CHANGELOG_v3 | 3 | ||||
| -rw-r--r-- | lib/sisu/v3/character_encoding.rb | 378 | ||||
| -rw-r--r-- | lib/sisu/v3/dal_character_check.rb | 6 | ||||
| -rw-r--r-- | lib/sisu/v3/hub.rb | 4 | 
4 files changed, 6 insertions, 385 deletions
diff --git a/data/doc/sisu/CHANGELOG_v3 b/data/doc/sisu/CHANGELOG_v3 index 0731f23a..0fdf55c3 100644 --- a/data/doc/sisu/CHANGELOG_v3 +++ b/data/doc/sisu/CHANGELOG_v3 @@ -37,6 +37,9 @@ http://www.jus.uio.no/sisu/pkg/src/sisu_3.3.3.orig.tar.xz  * v3: bin/sisu, hub, reorganize call +* v3: some pre-unicode meddling sorted +  (covers bug reported as middle dot changed to asterisk by chals) +  %% 3.3.2.orig.tar.xz (2012-06-30:26/6)  http://git.sisudoc.org/?p=code/sisu.git;a=log;h=refs/tags/sisu_3.3.2  http://git.sisudoc.org/?p=code/sisu.git;a=log;h=refs/tags/debian/sisu_3.3.2-1 diff --git a/lib/sisu/v3/character_encoding.rb b/lib/sisu/v3/character_encoding.rb deleted file mode 100644 index 17bf336b..00000000 --- a/lib/sisu/v3/character_encoding.rb +++ /dev/null @@ -1,378 +0,0 @@ -# encoding: utf-8 -=begin - - * Name: SiSU - - * Description: a framework for document structuring, publishing and search - - * Author: Ralph Amissah - - * Copyright: (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, -   2007, 2008, 2009, 2010, 2011, 2012 Ralph Amissah, All Rights Reserved. - - * License: GPL 3 or later: - -   SiSU, a framework for document structuring, publishing and search - -   Copyright (C) Ralph Amissah - -   This program is free software: you can redistribute it and/or modify it -   under the terms of the GNU General Public License as published by the Free -   Software Foundation, either version 3 of the License, or (at your option) -   any later version. - -   This program is distributed in the hope that it will be useful, but WITHOUT -   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or -   FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for -   more details. - -   You should have received a copy of the GNU General Public License along with -   this program. If not, see <http://www.gnu.org/licenses/>. - -   If you have Internet connection, the latest version of the GPL should be -   available at these locations: -   <http://www.fsf.org/licensing/licenses/gpl.html> -   <http://www.gnu.org/licenses/gpl.html> - -   <http://www.sisudoc.org/sisu/en/manifest/gpl.fsf.html> - - * SiSU uses: -   * Standard SiSU markup syntax, -   * Standard SiSU meta-markup syntax, and the -   * Standard SiSU object citation numbering and system - - * Hompages: -   <http://www.jus.uio.no/sisu> -   <http://www.sisudoc.org> - - * Download: -   <http://www.sisudoc.org/sisu/en/SiSU/download.html> - - * Ralph Amissah -   <ralph@amissah.com> -   <ralph.amissah@gmail.com> - - ** Description: modules related to locales, character encoding for different -    output generators [requires kirbybase] - -=end -module SiSU_CharacterEncode -  require 'kirbybase' -  require_relative 'sysenv'                             # sysenv.rb -  class Characters -    attr_accessor(:character_encoding,:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name) -    def initialize(&block) -      instance_eval(&block) -    end -  end -  class Create <Characters -    def initialize -      #NOTE places character_encoding.tbl in correct subdirectory ./_sisu_processing/encoding -      @db=KirbyBase.new                                         #default database location, pwd -      @ce_tbl=@db.create_table.documents(:character_encoding, :glyph,:String, :dec,:Integer, :hex,:String, :rb,:String, :html,:String, :html_name,:String, :tex,:String, :tex_licr,:String, :tex_alt,:String, :name,:String) -    end -    def db -      x=CharacterEncoding.new.table -      #x.each {|y| puts y[2].inspect} -      x.each do |c| -        #puts "#{c[0]}, #{c[1]}, #{c[2]}, #{c[3]}, #{c[4]}, #{c[5]}, #{c[6]}, #{c[7]}, #{c[8]}, #{c[9]}" -        @ce_tbl.insert(c[0], c[1], c[2], c[3], c[4], c[5], c[6], c[7], c[8], c[9]) -      end -    end -  end -  class Query -    def initialize(find='',show='') -      #NOTE character_encoding.tbl not read from subdirectory ./_sisu_processing/encoding -      @db=KirbyBase.new                                         #default database location, pwd -      @ce_tbl=@db.get_table(:character_encoding) -      @find=find -    end -    def selected(selected,show) -      @y=[] -      selected.each do |x| -        @y<<case show -        when 'glyph';     x.glyph -        when 'dec';       x.dec -        when 'hex';       x.hex -        when 'rb';        x.rb -        when 'html';      x.html -        when 'html_name'; x.html_name -        when 'tex';       x.tex -        when 'ot1';       x.ot1 -        when 'ts1';       x.ts1 -        when 'name';      x.name -        else              x.hex -        end -      end -      #@ce_tbl.select(:glyph,:name) { |r| r.hex==hex }.each do |r| -      #  puts '%s %s' % [r.glyph, r.name] -      #end -      #:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name -      #list=['number','glyph','html','hex','rb','tex','ot1','ts1','name'] -    end -    def hex(hex,show) -      select=@ce_tbl.select(:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name) { |r| r.hex==hex } -      selected(select,show) -      @y -    end -    def dec(dec,show) -      select=@ce_tbl.select(:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name) { |r| r.dec==dec } -      selected(select,show) -      @y -    end -    def name(name,show) -      select=@ce_tbl.select(:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name) { |r| r.name =~ /#{name}/ } -      selected(select,show) -      @y -    end -    def report -      puts @ce_tbl.select(:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name).to_report -    end -    def table -      selected=@ce_tbl.select -      #selected=@ce_tbl.select(:glyph,:dec,:hex,:rb,:html,:html_name,:tex,:tex_licr,:tex_alt,:name) -      selected.each do |c| -        puts '%s %s %s %s %s %s %s %s %s %s' % [c.glyph,c.dec,c.hex,c.rb,c.html,c.html_name,c.tex,c.tex_licr,c.tex_alt,c.name] -        #puts "#{c.glyph}, #{c.dec}, #{c.hex}, #{c.rb}, #{c.html}, #{c.name}, #{c.tex}, #{c.tec_licr}, #{c.tex_alt}, #{c.c_name}" -      end -    end -  end -  class CharacterEncoding -    def table -      x=[] -#:glyph, :dec,:hex,  :rb,            :xml ,   :html_name,  :tex,    :tex_licr,         :tex_alt,          :name -      x=[ -  ['',     9, '',    '',             '	', nil,         '',     '',                '',                'Horizontal tab'  ], -  ['',    15, '',    '',             '', nil,         '',     '',                '',                'Line feed'       ], -  ['',    17, '',    '',             '', nil,         '',     '',                '',                'Carriage return' ], -  [' ',   32, '40',  '\40',          ' ', nil,         '',     '',                '',                'Space'           ], -  ['!',   33, '41',  '\41',          '!', nil,         '!',    '!',               '!',               'Punctuation Exclamation !' ], -  ['',    34, '42',  '\42',          '"', '"',    '',     '',                '',                'Punctuation Quotation mark' ], -  ['#',   35, '43',  '\43',          '#', nil,         '{\#}', '\#',              '',                'Hash mark    #' ], -  ['$',   36, '44',  '\44',          '$', nil,         '{\$}', '\textdollar',     '',                'Dollar sign  $' ], -  ['%',   37, '45',  '\45',          '%', nil,         '{\%}', '\%',              '',                'Percent sign %' ], -  ['&',   38, '46',  '\46',          '&', '&',     '{\&}', '\&',              '',                'Ampersand    &' ], -  ['\'',  39, '47',  '\47',          ''', nil,         '',     '',                '',                'Apostrophe   \''], -  ['(',   40, '50',  '\50',          '(', nil,         '',     '',                '',                'Left parenthesis  (' ], -  [')',   41, '51',  '\51',          ')', nil,         '',     '',                '',                'Right parenthesis )' ], -  ['*',   42, '52',  '\52',          '*', nil,         '',     '',                '',                'Asterisk     *' ], -  ['+',   43, '53',  '\53',          '+', nil,         '',     '',                '',                'Plus sign    +' ], -  [',',   44, '54',  '\54',          ',', nil,         ',',    ',',               ',',               'Puncutation Comma  ,' ], -  ['-',   45, '55',  '\55',          '-', nil,         '-',    '-',               '-',               'Puncutation Hyphen -' ], -  ['.',   46, '56',  '\56',          '.', nil,         '.',    '.',               '.',               'Puncutation Period .' ], -  ['/',   47, '57',  '\57',          '/', nil,         '/',    '/',               '/',               'Puncutation Slash  /' ], -  ['0',   48, '60',  '\60',          '0', nil,         '0',    '0',               '0',               'Digit zero  0' ], -  ['1',   49, '61',  '\61',          '1', nil,         '1',    '1',               '1',               'Digit one   1' ], -  ['2',   50, '62',  '\62',          '2', nil,         '2',    '2',               '2',               'Digit two   2' ], -  ['3',   51, '63',  '\63',          '3', nil,         '3',    '3',               '3',               'Digit three 3' ], -  ['4',   52, '64',  '\64',          '4', nil,         '4',    '4',               '4',               'Digit four  4' ], -  ['5',   53, '65',  '\65',          '5', nil,         '5',    '5',               '5',               'Digit five  5' ], -  ['6',   54, '66',  '\66',          '6', nil,         '6',    '6',               '6',               'Digit six   6' ], -  ['7',   55, '67',  '\67',          '7', nil,         '7',    '7',               '7',               'Digit seven 7' ], -  ['8',   56, '70',  '\70',          '8', nil,         '8',    '8',               '8',               'Digit eight 8' ], -  ['9',   57, '71',  '\71',          '9', nil,         '9',    '9',               '9',               'Digit nine  9' ], -  [':',   58, '72',  '\72',          ':', nil,         '',     '',                '',                'Punctuation Colon     :' ], -  [';',   59, '73',  '\73',          ';', nil,         '',     '',                '',                'Punctuation Semicolon ;' ], -  ['<',   60, '74',  '\74',          '<', '<',      '',     '',                '',                'Less than    <' ], -  ['=',   61, '75',  '\75',          '=', nil,         '',     '',                '',                'Equals sign  =' ], -  ['>',   62, '76',  '\76',          '>', '>',      '',     '',                '',                'Greater than >' ], -  ['?',   63, '77',  '\77',          '?', nil,         '?',    '?',               '?',               'Punctuation Question mark ?' ], -  ['@',   64, '100', '\100',         '@', nil,         '',     '',                '',                'Commercial at sign           @' ], -  ['A',   65, '101', '\101',         'A', nil,         'A',    'A',               'A',               'Captial A' ], -  ['B',   66, '102', '\102',         'B', nil,         'B',    'B',               'B',               'Captial B' ], -  ['C',   67, '103', '\103',         'C', nil,         'C',    'C',               'C',               'Captial C' ], -  ['D',   68, '104', '\104',         'D', nil,         'D',    'D',               'D',               'Captial D' ], -  ['E',   69, '105', '\105',         'E', nil,         'E',    'E',               'E',               'Captial E' ], -  ['F',   70, '106', '\106',         'F', nil,         'F',    'F',               'F',               'Captial F' ], -  ['G',   71, '107', '\107',         'G', nil,         'G',    'G',               'G',               'Captial G' ], -  ['H',   72, '110', '\110',         'H', nil,         'H',    'H',               'H',               'Captial H' ], -  ['I',   73, '111', '\111',         'I', nil,         'I',    'I',               'I',               'Captial I' ], -  ['J',   74, '112', '\112',         'J', nil,         'J',    'J',               'J',               'Captial J' ], -  ['K',   75, '113', '\113',         'K', nil,         'K',    'K',               'K',               'Captial K' ], -  ['L',   76, '114', '\114',         'L', nil,         'L',    'L',               'L',               'Captial L' ], -  ['M',   77, '115', '\115',         'M', nil,         'M',    'M',               'M',               'Captial M' ], -  ['N',   78, '116', '\116',         'N', nil,         'N',    'N',               'N',               'Captial N' ], -  ['O',   79, '117', '\117',         'O', nil,         'O',    'O',               'O',               'Captial O' ], -  ['P',   80, '120', '\120',         'P', nil,         'P',    'P',               'P',               'Captial P' ], -  ['Q',   81, '121', '\121',         'Q', nil,         'Q',    'Q',               'Q',               'Captial Q' ], -  ['R',   82, '122', '\122',         'R', nil,         'R',    'R',               'R',               'Captial R' ], -  ['S',   83, '123', '\123',         'S', nil,         'S',    'S',               'S',               'Captial S' ], -  ['T',   84, '124', '\124',         'T', nil,         'T',    'T',               'T',               'Captial T' ], -  ['U',   85, '125', '\125',         'U', nil,         'U',    'U',               'U',               'Captial U' ], -  ['V',   86, '126', '\126',         'V', nil,         'V',    'V',               'V',               'Captial V' ], -  ['W',   87, '127', '\127',         'W', nil,         'W',    'W',               'W',               'Captial W' ], -  ['X',   88, '130', '\130',         'X', nil,         'X',    'X',               'X',               'Captial X' ], -  ['Y',   89, '131', '\131',         'Y', nil,         'Y',    'Y',               'Y',               'Captial Y' ], -  ['Z',   90, '132', '\132',         'Z', nil,         'Z',    'Z',               'Z',               'Captial Z' ], -  ['[',   91, '133', '\133',         '[', nil,         '',     '',                '',                'Left square bracket  [' ], -  ['\\',  92, '134', '\134',         '\', nil,         '',     '\textbackslash',  '',                'Backslash            \\'], -  [']',   93, '135', '\135',         ']', nil,         '',     '',                '',                'Right square bracket ]' ], -  ['^',   94, '136', '\136',         '^', nil,         '',     '',                '',                'Caret                ^' ], -  ['_',   95, '137', '\137',         '_', nil,         '{\_}', '\textunderscore', '',                'Underscore           _' ], -  ['`',   96, '140', '\140',         '`', nil,         '',     '',                '',                'Grave accent         `' ], -  ['a',   97, '141', '\141',         'a', nil,         'a',    'a',               'a',               'Small a' ], -  ['b',   98, '142', '\142',         'b', nil,         'b',    'b',               'b',               'Small b' ], -  ['c',   99, '143', '\143',         'c', nil,         'c',    'c',               'c',               'Small c' ], -  ['d',  100, '144', '\144',         'd', nil,         'd',    'd',               'd',               'Small d' ], -  ['e',  101, '145', '\145',         'e', nil,         'e',    'e',               'e',               'Small e' ], -  ['f',  102, '146', '\146',         'f', nil,         'f',    'f',               'f',               'Small f' ], -  ['g',  103, '147', '\147',         'g', nil,         'g',    'g',               'g',               'Small g' ], -  ['h',  104, '150', '\150',         'h', nil,         'h',    'h',               'h',               'Small h' ], -  ['i',  105, '151', '\151',         'i', nil,         'i',    'i',               'i',               'Small i' ], -  ['j',  106, '152', '\152',         'j', nil,         'j',    'j',               'j',               'Small j' ], -  ['k',  107, '153', '\153',         'k', nil,         'k',    'k',               'k',               'Small k' ], -  ['l',  108, '154', '\154',         'l', nil,         'l',    'l',               'l',               'Small l' ], -  ['m',  109, '155', '\155',         'm', nil,         'm',    'm',               'm',               'Small m' ], -  ['n',  110, '156', '\156',         'n', nil,         'n',    'n',               'n',               'Small n' ], -  ['o',  111, '157', '\157',         'o', nil,         'o',    'o',               'o',               'Small o' ], -  ['p',  112, '160', '\160',         'p', nil,         'p',    'p',               'p',               'Small p' ], -  ['q',  113, '161', '\161',         'q', nil,         'q',    'q',               'q',               'Small q' ], -  ['r',  114, '162', '\162',         'r', nil,         'r',    'r',               'r',               'Small r' ], -  ['s',  115, '163', '\163',         's', nil,         's',    's',               's',               'Small s' ], -  ['t',  116, '164', '\164',         't', nil,         't',    't',               't',               'Small t' ], -  ['u',  117, '165', '\165',         'u', nil,         'u',    'u',               'u',               'Small u' ], -  ['v',  118, '166', '\166',         'v', nil,         'v',    'v',               'v',               'Small v' ], -  ['w',  119, '167', '\167',         'w', nil,         'w',    'w',               'w',               'Small w' ], -  ['x',  120, '170', '\170',         'x', nil,         'x',    'x',               'x',               'Small x' ], -  ['y',  121, '171', '\171',         'y', nil,         'y',    'y',               'y',               'Small y' ], -  ['z',  122, '172', '\172',         'z', nil,         'z',    'z',               'z',               'Small z' ], -  ['{',  123, '173', '\173',         '{', nil,         '{\{}', '\{',              '',                'Left curly brace     {' ], -  ['|',  124, '174', '\174',         '|', nil,         '',     '',                '',                'Vertical bar / pipe  |' ], -  ['}',  125, '175', '\175',         '}', nil,         '{\}}', '\}',              '',                'Right curly brace    }' ], -  ['~',  126, '176', '\176',         '~', nil,         '',     '',                '',                'Tilde                ~' ], -  ['',   127, '177', '',             '', nil,         '',     '',                '',                '                      ' ], -  ['',   128, '200', '',             '€', nil,         '',     '',                '',                '                      ' ], -  ['',   129, '201', '',             '', nil,         '',     '',                '',                '                      ' ], -  ['\'', 130, '202', '',             '‚', nil,         '',     '',                '',                'Low left single quote        \''], -  [' ',  131, '203', '',             'ƒ', nil,         '',     '',                '',                'Florin                        ' ], -  ['"',  132, '204', '',             '„', nil,         '',     '',                '',                'Low left double quote        "' ], -  ['…',  133, '205', '\342\200\246', '…', nil,         '…',    '\textellipsis',   '',                'Ellipsis             …' ], -  ['†',  134, '206', '\342\200\240', '†', nil,         '†',    '\textdagger',     '',                'Dagger               †' ], -  ['‡',  135, '207', '\342\200\241', '‡', nil,         '‡',    '\textdaggerbl',   '',                'Double dagger        ‡' ], -  ['^',  136, '210', '',             'ˆ', nil,         '',     '',                '',                'Circumflex           ^' ], -  ['',   137, '211', '',             '‰', nil,         '',     '',                '',                'Permil               ' ], -  ['',   138, '212', '',             'Š', nil,         '',     '',                '',                'Capital S, caron     ' ], -  ['<',  139, '213', '',             '‹', nil,         '',     '',                '',                'Less than sign (see &060;)   <' ], -  ['',   140, '214', '',             'Œ', nil,         '',     '',                '',                'Capital OE ligature   ' ], -  ['',   141, '215', '',             '', nil,         '',     '',                '',                '                      ' ], -  ['',   142, '216', '',             'Ž', nil,         '',     '',                '',                'Capital Z, caron      ' ], -  ['',   143, '217', '',             '', nil,         '',     '',                '',                '                      ' ], -  ['',   144, '220', '',             '', nil,         '',     '',                '',                '                      ' ], -  ['',   145, '221', '',             '‘', nil,         '',     '',                '',                'Left single quote     ' ], -  ['',   146, '222', '',             '’', nil,         '',     '',                '',                'Right single quote    ' ], -  ['',   147, '223', '',             '“', nil,         '',     '',                '',                'Left double quote     ' ], -  ['',   148, '224', '',             '”', nil,         '',     '',                '',                'Right double quote    ' ], -  ['',   149, '225', '',             '•', nil,         '',     '',                '',                'Bullet                ' ], -  ['-',  150, '226', '',             '–', nil,         '',     '',                '',                'En dash              -' ], -  ['',   151, '227', '',             '—', nil,         '',     '',                '',                'Em dash              -' ], -  ['~',  152, '230', '',             '˜', nil,         '',     '',                '',                'Tilde (see &126;)    ~' ], -  ['t',  153, '231', '',             '™', nil,         '',     '',                '',                'Trademark            t' ], -  ['',   154, '232', '',             'š', nil,         '',     '',                '',                'small s, caron        ' ], -  ['',   155, '233', '',             '›', nil,         '',     '',                '',                'Greater than sign (see &062;) ' ], -  ['',   156, '234', '',             'œ', nil,         '',     '',                '',                'Small oe ligature        ' ], -  ['',   157, '235', '',             '', nil,         '',     '',                '',                '                         ' ], -  ['',   158, '236', '',             'ž', nil,         '',     '',                '',                'Small z, caron           ' ], -  ['',   159, '237', '',             'Ÿ', nil,         '',     '',                '',                'Capital Y, umlaut        ' ], -  ['',   160, '240', '',             ' ', ' ',    '',     '',                '',                'Non-breaking space       ' ], -  ['¡',  161, '241', '\302\241',     '¡', '¡',   '¡',    '',                '',                'Inverted exclamation     ' ], -  ['¢',  162, '242', '\302\242',     '¢', '¢',    '¢',    '',                '',                'Cent sign               ¢' ], -  ['£',  163, '243', '\302\243',     '£', '£',   '£',    '\textsterling',   '',                'Pound sign              £' ], -  ['¤',  164, '244', '\302\244',     '¤', '¤',  '¤',    '\textcurrency',   '',                'General currency sign    ' ], -  ['¥',  165, '245', '\302\245',     '¥', '¥',     '¥',    '',                '',                'Yen sign                ¥' ], -  ['¦',  166, '246', '\302\246',     '¦', '¦',  '¦',    '',                '',                'Broken vertical bar      ' ], -  ['§',  167, '247', '\302\247',     '§', '§',    '§',    '\textsection',    '',                'Section sign            §' ], -  ['¨',  168, '250', '\302\250',     '¨', '¨',     '¨',    '\"',              '',                'Umlaut                   ' ], -  ['©',  169, '251', '\302\251',     '©', '©',    '©',    '\copyright',      '\textcopyright',  'Copyright               ©' ], -  ['ª',  170, '252', '\302\252',     'ª', 'ª',    'ª',    '',                '',                'Feminine ordinal        ª' ], -  ['«',  171, '253', '\302\253',     '«', '«',   '«',    '',                '',                'Left angle quote        «' ], -  ['¬',  172, '254', '\302\254',     '¬', '¬',     '¬',    '',                '',                'Not sign                 ' ], -  ['',  173, '255', '\302\255',     '­', '­',     '',    '',                '',                'Soft hyphen              ' ], -  ['®',  174, '256', '\302\256',     '®', '®',     '®',    '',                '',                'Registered trademark    ®' ], -  ['¯',  175, '257', '\302\257',     '¯', '¯',    '¯',    '',                '',                'Macron accent            ' ], -  ['°',  176, '260', '\302\260',     '°', '°',     '°',    '',                '',                'Degree sign             °' ], -  ['±',  177, '261', '\302\261',     '±', '&plusmin;', '±',    '',                '',                'Plus or minus           ±' ], -  ['²',  178, '262', '\302\262',     '²', '²',    '²',    '',                '',                'Superscript 2           ²' ], -  ['³',  179, '263', '\302\263',     '³', '³',    '³',    '',                '',                'Superscript 3           ³' ], -  ['',   180, '264', '\302\264',     '´', '´',   ''',    '',                '',                'Acute accent             ' ], -  ['µ',  181, '265', '\302\265',     'µ', 'µ',   'µ',    '',                '',                'Micro sign (Greek mu)   µ' ], -  ['¶',  182, '266', '\302\266',     '¶', '¶',    '¶',    '\textparagraph',  '',                'Paragraph sign          ¶' ], -  ['·',  183, '267', '\302\267',     '·', '·',  %q{·},  '',                %q{},              'Middle dot               ' ], -  ['¸',  184, '270', '\302\270',     '¸', '¸',   '¸',    '',                '',                'Cedilla                  ' ], -  ['¹',  185, '271', '\302\271',     '¹', '¹',    '¹',    '',                '',                'Superscript 1           ¹' ], -  ['º',  186, '272', '\302\272',     'º', 'º',    'º',    '',                '',                'Masculine ordinal       º' ], -  ['»',  187, '273', '\302\273',     '»', '»',   '»',    '',                '',                'Right angle quote        ' ], -  ['¼',  188, '274', '\302\274',     '¼', '¼',  '¼',    '',                '',                'Fraction one quarter    ¼' ], -  ['½',  189, '275', '\302\275',     '½', '½',  '½',    '',                '',                'Fraction on half        ½' ], -  ['¾',  190, '276', '\302\276',     '¾', '¾',  '¾',    '',                '',                'Fraction three quarters ¾' ], -  ['¿',  191, '277', '\302\277',     '¿', '¿',  '¿',    '',                '',                'Inverted question mark  ¿' ], -  ['À',  192, '300', '\303\200',     'À', 'À',  'À',    '\`{A}',           '',                'Capital A, grave accent À' ], -  ['Á',  193, '301', '\303\201',     'Á', 'Á',  'Á',    %q{\'{A}},         '',                'Capital A, acute accent Á' ], -  ['Â',  194, '302', '\303\202',     'Â', 'Â',   'Â',    '^{A}',            '',                'Capital A, circumflex accent Â' ], -  ['Ã',  195, '303', '\303\203',     'Ã', 'Ã',  'Ã',    '~{A}',            '',                'Capital A, tilde        Ã' ], -  ['Ä',  196, '304', '\303\204',     'Ä', 'Ä',    'Ä',    '"{A}',            '',                'Capital A, umlaut       Ä' ], -  ['Å',  197, '305', '\303\205',     'Å', 'Å',   'Å',    'r{A}',            '',                'Capital A, ring         Å' ], -  ['Æ',  198, '306', '\303\206',     'Æ', 'Æ',   'Æ',    'AE',              '',                'Capital AE ligature     Æ' ], -  ['Ç',  199, '307', '\303\207',     'Ç', 'Ç',  'Ç',    '',                '',                'Capital C, cedilla      Ç' ], -  ['È',  200, '310', '\303\210',     'È', 'È',  'È',    '`{E}',            '',                'Capital E, grave accent È' ], -  ['É',  201, '311', '\303\211',     'É', 'É',  'É',    ''{E}',            '',                'Capital E, acute accent É' ], -  ['Ê',  202, '312', '\303\212',     'Ê', 'Ê',   'Ê',    '^{E}',            '',                'Capital E, circumflex accent Ê' ], -  ['Ë',  203, '313', '\303\213',     'Ë', 'Ë',    'Ë',    '"{E}',            '',                'Capital E, umlaut       Ë' ], -  ['Ì',  204, '314', '\303\214',     'Ì', 'Ì',  'Ì',    '`{I}',            '',                'Capital I, grave accent Ì' ], -  ['Í',  205, '315', '\303\215',     'Í', 'Í',  'Í',    ''{I}',            '',                'Capital I, acute accent Í' ], -  ['Î',  206, '316', '\303\216',     'Î', 'Î',   'Î',    '^{I}',            '',                'Capital I, circumflex accent Î' ], -  ['Ï',  207, '317', '\303\217',     'Ï', 'Ï',    'Ï',    '"{I}',            '',                'Capital I, umlaut       Ï' ], -  ['Ð',  208, '320', '\303\220',     'Ð', 'Ð',     'Ð',    '',                '',                'Capital eth, Icelandic   ' ], -  ['Ñ',  209, '321', '\303\221',     'Ñ', 'Ñ',  'Ñ',    '',                '',                'Capital N, tilde        Ñ' ], -  ['Ò',  210, '322', '\303\222',     'Ò', 'Ò',  'Ò',    '`{O}',            '',                'Capital O, grave accent Ò' ], -  ['Ó',  211, '323', '\303\223',     'Ó', 'Ó',  'Ó',    ''{O}',            '',                'Capital O, acute accent Ó' ], -  ['Ô',  212, '324', '\303\224',     'Ô', 'Ô',   'Ô',    '^{O}',            '',                'Capital O, circumflex accent Ô' ], -  ['Õ',  213, '325', '\303\225',     'Õ', 'Õ',  'Õ',    '~{O}',            '',                'Capital O, tilde        Õ' ], -  ['Ö',  214, '326', '\303\226',     'Ö', 'Ö',    'Ö',    '"{O}',            '',                'Capital O, umlaut       Ö' ], -  ['×',  215, '327', '\303\227',     '×', '×',   '×',    '',                '',                'Multiply sign           ×' ], -  ['Ø',  216, '330', '\303\230',     'Ø', 'Ø',  'Ø',    'O',               '',                'Capital O, slash        Ø' ], -  ['Ù',  217, '331', '\303\231',     'Ù', 'Ù',  'Ù',    '',                '',                'Capital U, grave accent Ù' ], -  ['Ú',  218, '332', '\303\232',     'Ú', 'Ú',  'Ú',    '',                '',                'Capital U, acute accent Ú' ], -  ['Û',  219, '333', '\303\233',     'Û', 'Û',   'Û',    '',                '',                'Capital U, circumflex accent Û' ], -  ['Ü',  220, '334', '\303\234',     'Ü', 'Ü',    'Ü',    '',                '',                'Capital U, umlaut       Ü' ], -  ['Ý',  221, '335', '\303\235',     'Ý', 'Ý',  'Ý',    '',                '',                'Capital Y, acute accent Ý' ], -  ['Þ',  222, '336', '\303\236',     'Þ', 'Þ',   'Þ',    '',                '',                'Capital thorn, Icelandic     Þ' ], -  ['ß',  223, '337', '\303\237',     'ß', 'ß',   'ß',    '',                '',                'Small sz ligature, German    ß' ], -  ['à',  224, '340', '\303\240',     'à', 'à',  'à',    '\`{a}',           '',                'Small a, grave accent   à' ], -  ['á',  225, '341', '\303\241',     'á', 'á',  'á',    %q{\'{a}},         '',                'Small a, acute accent   á' ], -  ['â',  226, '342', '\303\242',     'â', 'â',   'â',    '\^{a}',           '',                'Small a, circumflex accent   â' ], -  ['ã',  227, '343', '\303\243',     'ã', 'ã',  'ã',    '\~{a}',           '',                'Small a, tilde          ã' ], -  ['ä',  228, '344', '\303\244',     'ä', 'ä',    'ä',    '\"{a}',           '',                'Small a, umlaut         ä' ], -  ['å',  229, '345', '\303\245',     'å', 'å',   'å',    '\r{a}',           '',                'Small a, ring           å' ], -  ['æ',  230, '346', '\303\246',     'æ', 'æ',   'æ',    '\ae',             '',                'Small ae ligature       æ' ], -  ['ç',  231, '347', '\303\257',     'ç', 'ç',  'ç',    '',                '',                'Small c, cedilla        ç' ], -  ['è',  232, '350', '\303\250',     'è', 'è',  'è',    '\`{e}',           '',                'Small e, grave accent   è' ], -  ['é',  233, '351', '\303\251',     'é', 'é',  'é',    %q{\'{e}},         '',                'Small e, acute accent   é' ], -  ['ê',  234, '352', '\303\252',     'ê', 'ê',   'ê',    '\^{e}',           '',                'Small e, circumflex accent   ê' ], -  ['ë',  235, '353', '\303\253',     'ë', 'ë',    'ë',    '\"{e}',           '',                'Small e, umlaut         ë' ], -  ['ì',  236, '354', '\303\254',     'ì', 'ì',  'ì',    '\`{i}',           '',                'Small i, grave accent   ì' ], -  ['í',  237, '355', '\303\255',     'í', 'í',  'í',    '\'{i}',           '',                'Small i, acute accent   í' ], -  ['î',  238, '356', '\303\256',     'î', 'î',   'î',    '\^{i}',           '',                'Small i, circumflex accent   î' ], -  ['ï',  239, '357', '\303\257',     'ï', 'ï',    'ï',    '\"{i}',           '',                'Small i, umlaut         ï' ], -  ['ð',  240, '360', '\303\260',     'ð', 'ð',     'ð',    '',                '',                'Small eth, Icelandic    ð' ], -  ['ñ',  241, '361', '\303\261',     'ñ', 'ñ',  'ñ',    '',                '',                'Small n, tilde          ñ' ], -  ['ò',  242, '362', '\303\262',     'ò', 'ò',  'ò',    '\`{o}',           '',                'Small o, grave accent   ò' ], -  ['ó',  243, '363', '\303\263',     'ó', 'ó',  'ó',    %q{\'{o}},         '',                'Small o, acute accent   ó' ], -  ['ô',  244, '364', '\303\264',     'ô', 'ô',   'ô',    '\^{o}',           '',                'Small o, circumflex accent   ô' ], -  ['õ',  245, '365', '\303\265',     'õ', 'õ',  'õ',    '\^{o}',           '',                'Small o, tilde          õ' ], -  ['ö',  246, '366', '\303\266',     'ö', 'ö',    'ö',    '\"{o}',           '',                'Small o, umlaut         ö' ], -  ['÷',  247, '367', '\303\267',     '÷', '÷',  '÷',    '',                '',                'Divide sign             ÷' ], -  ['ø',  248, '370', '\303\270',     'ø', 'ø',  'ø',    '',                '',                'Small o, slash          ø' ], -  ['ù',  249, '371', '\303\271',     'ù', 'ù',  'ù',    '\`{u}',           '',                'Small u, grave accent   ù' ], -  ['ú',  250, '372', '\303\272',     'ú', 'ú',  'ú',    %q{\'{u}},         '',                'Small u, acute accent   ú' ], -  ['û',  251, '373', '\303\273',     'û', 'û',   'û',    '\^{u}',           '',                'Small u, circumflex accent   û' ], -  ['ü',  252, '374', '\303\274',     'ü', 'ü',    'ü',    '\"{u}',           '',                'Small u, umlaut         ü' ], -  ['ý',  253, '375', '\303\275',     'ý', 'ý',  'ý',    '',                '',                'Small y, acute accent   ý' ], -  ['þ',  254, '376', '\303\276',     'þ', 'þ',   'þ',    '',                '',                'Small thorn, Icelandic  þ' ], -  ['ÿ',  255, '377', '\303\277',     'ÿ', 'ÿ',    'ÿ',    '',                '',                'Smally y, umlaut        ÿ' ], -  ['∝',     ,    '',         '',    '∝', '∝',    '∝',    '',                '',                'proportional to  U+221D (8733) ∝' ], -  ['∞',     ,    '',         '',    '∞', '∞',   '∞',    '',                '',                'infinity  U+221E (8734) ∞' ], -] -    end -  end -end -__END__ diff --git a/lib/sisu/v3/dal_character_check.rb b/lib/sisu/v3/dal_character_check.rb index fdba5086..df14e1aa 100644 --- a/lib/sisu/v3/dal_character_check.rb +++ b/lib/sisu/v3/dal_character_check.rb @@ -78,8 +78,6 @@ module SiSU_DAL_CharacterCheck              gsub(/<br>/,"#{Mx[:br_line]}").                              #needed by xml, xhtml etc.              gsub(/\t/,' ').              gsub(/\342\200\231/u,"'"). #if dob =~/’/  #Avoid #‘ ’ #“ ” -            gsub(/�/u,' ').                                              #watch, replace with char code -            gsub(/·/u,'*').              gsub(/\\copy(?:right)?\b/,'©').              gsub(/\\trademark\b|\\tm\b/,'®')            dob.obj=dob.obj + "\n" @@ -87,7 +85,9 @@ module SiSU_DAL_CharacterCheck              case dob.obj              when /\^~/                                     #% Note must do this first (earlier loop) and then enter gathered data into ~^\d+                sub_dob=dob.obj.dup -              @endnote_array << sub_dob.gsub(/\n/,'').gsub(/\^~\s+(.+)\s*/,%{#{Mx[:en_a_o]}#{endnote_no} \\1 #{Mx[:en_a_c]}}).strip +              @endnote_array << sub_dob.gsub(/\n/,''). +                gsub(/\^~\s+(.+)\s*/,%{#{Mx[:en_a_o]}#{endnote_no} \\1 #{Mx[:en_a_c]}}). +                strip                endnote_no+=1                dob=nil if dob.obj =~/\^~ .+/                #watch, removes 'binary' endnote now in endnote array for later insertion              end diff --git a/lib/sisu/v3/hub.rb b/lib/sisu/v3/hub.rb index ac103830..2ab95052 100644 --- a/lib/sisu/v3/hub.rb +++ b/lib/sisu/v3/hub.rb @@ -209,10 +209,6 @@ p "#{__LINE__}:#{__FILE__}" if @opt.act[:maintenance][:set] ==:on        require_relative 'cgi'                           # cgi.rb        SiSU_CGI::SearchSQL.new(@opt).read      end -    def encoding                                       # -K build character encoding db (uses KirbyBase) -      require_relative 'character_encoding'            # character_encoding.rb -      SiSU_CharacterEncode::Create.new.db -    end      def termsheet                                          # -t        system("sisu_termsheet #{@opt.cmd} #{@opt.fns}\n")        @@n_do=@@n_do+1  | 
