summaryrefslogblamecommitdiffstats
path: root/modules/misc_cleanup/numbers.pl
blob: 567494fedef27908be7311f3af7b13b0024a8dab (plain) (tree)





















































































                                                                                                                     
#!/usr/bin/perl

# numbers.pl translates Western (ASCII) digits into Arabic-Indic digits in the text nodes of XML files

## Licensed under the standard BSD license:

# Copyright (c) 2002-2011 CrossWire Bible Society <http://www.crosswire.org/>
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are
# met:
#
#     * Redistributions of source code must retain the above copyright
#        notice, this list of conditions and the following disclaimer.
#     * Redistributions in binary form must reproduce the above copyright
#       notice, this list of conditions and the following disclaimer in
#       the documentation and/or other materials provided with the
#       distribution.
#     * Neither the name of the CrossWire Bible Society nor the names of
#       its contributors may be used to endorse or promote products
#       derived from this software without specific prior written
#       permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
# IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
# TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
# PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

## For general inquiries, comments, suggestions, bug reports, etc. email:
## sword-support@crosswire.org

#########################################################################
use XML::LibXML;
use utf8;
use strict;

## Obtain arguments
# Usage: numbers.pl <osisfile> [-o outputfile]
# With no arguments, print the usage text and exit with a failure status.
if (scalar(@ARGV) < 1) {
    print "\nnumbers.pl <osisfile> [-o outputfile]-- - fix Latin numbers in Arabic script text \n";
    print "- Arguments in braces < > are required. Arguments in brackets [ ] are optional.\n";
    # The script has never created <osisfile>.new; without -o the result
    # goes to standard output, so the usage text says exactly that.
    print "- If no -o option is specified for the output filename, the output is written to standard output.\n";
    exit (-1);
}

my $file = $ARGV[0];
my $nextarg = 1;
my $outputFilename;

# Output goes to STDOUT unless "-o <outputfile>" follows the input file.
my $out_fh = \*STDOUT;

if (defined $ARGV[$nextarg] && $ARGV[$nextarg] eq "-o") {
    $outputFilename = $ARGV[$nextarg + 1];
    die "Option -o requires an output filename.\n"
        unless defined $outputFilename && length $outputFilename;
    # No encoding layer on purpose: the document's toString() is written
    # out as returned by the parser library.
    open($out_fh, ">", $outputFilename)
        or die "Could not open file $outputFilename for writing: $!";
}

## Initialise OSIS file

my $parser = XML::LibXML->new();
my $doc = $parser->parse_file($file);

# Rewrite the digits of every text node of the document in place.
delatinize($doc);

print {$out_fh} $doc->toString();

# Buffered write errors only surface when the handle is closed.
if (defined $outputFilename) {
    close($out_fh)
        or die "Could not finish writing file $outputFilename: $!";
}

# delatinize($node)
#
# Recursively walks the DOM subtree rooted at $node and rewrites, in place,
# every ASCII digit (0-9) found in a text node to the corresponding digit of
# the replacement list used in the tr/// below.
#
# Parameters:
#   $node - an XML::LibXML node; the script passes the parsed document.
#
# Returns nothing; the text nodes of the tree are modified in place.
sub delatinize {
    my ($node) = @_;

    if ($node->nodeType == XML_TEXT_NODE) {
        # Read the node's character data rather than toString(): toString()
        # serialises the node, so '&', '<' and '>' come back as entities and
        # the serialised form no longer matches the stored data. Replacing
        # "the serialised string" therefore silently skipped such nodes.
        my $text = $node->data;
        # tr/// takes plain character lists, not a regex class, so no [ ].
        $text =~ tr/0123456789/۰۱۲۳۴۵۶۷۸۹/;
        $node->setData($text);
        return;
    }

    # Any other node type: descend into its children (if any).
    for my $child ($node->childNodes()) {
        delatinize($child);
    }
    return;
}