lib/scripts/fixgreek.pl
author wenzelm
Thu, 29 Apr 2004 06:04:01 +0200
changeset 14687 e089757b952a
parent 14171 0cab06e3bbd0
child 14981 e73f8140af78
permissions -rw-r--r--
added is_keyword;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
14171
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     1
#
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     2
# $Id$
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     3
# Author: Sebastian Skalberg, TU Muenchen
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     4
# License: GPL (GNU GENERAL PUBLIC LICENSE)
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     5
#
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     6
# fixgreek.pl - fix problems with greek and other foreign letters now
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     7
#               being classified as letters instead of symbols.
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     8
#
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
     9
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    10
sub fixgreek {
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    11
    my ($file) = @_;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    12
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    13
    open (FILE, $file) || die $!;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    14
    undef $/; $text = <FILE>; $/ = "\n";         # slurp whole file
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    15
    close FILE || die $!;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    16
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    17
    $_ = $text;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    18
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    19
    s/(\\<(a|b|c|d|e|f|g|h|i|j|k|l|m|n|o|p|q|r|s|t|u|v|w|x|y|z|A|B|C|D|E|F|G|H|I|J|K|L|M|N|O|P|Q|R|S|T|U|V|W|X|Y|Z)>)([a-zA-Z0-9])/$1 $3/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    20
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    21
    s/([a-zA-Z][a-zA-Z0-9]*)(\\<(a|b|c|d|e|f|g|h|i|j|k|l|m|n|o|p|q|r|s|t|u|v|w|x|y|z|A|B|C|D|E|F|G|H|I|J|K|L|M|N|O|P|Q|R|S|T|U|V|W|X|Y|Z)>)/$1 $2/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    22
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    23
    s/(\\<(aa|bb|cc|dd|ee|ff|gg|hh|ii|jj|kk|ll|mm|nn|oo|pp|qq|rr|ss|tt|uu|vv|ww|xx|yy|zz|AA|BB|CC|DD|EE|FF|GG|HH|II|JJ|KK|LL|MM|NN|OO|PP|QQ|RR|SS|TT|UU|VV|WW|XX|YY|ZZ)>)([a-zA-Z0-9])/$1 $3/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    24
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    25
    s/([a-zA-Z][a-zA-Z0-9]*)(\\<(aa|bb|cc|dd|ee|ff|gg|hh|ii|jj|kk|ll|mm|nn|oo|pp|qq|rr|ss|tt|uu|vv|ww|xx|yy|zz|AA|BB|CC|DD|EE|FF|GG|HH|II|JJ|KK|LL|MM|NN|OO|PP|QQ|RR|SS|TT|UU|VV|WW|XX|YY|ZZ)>)/$1 $2/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    26
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    27
    s/(\\<(alpha|beta|gamma|delta|epsilon|zeta|eta|theta|iota|kappa|mu|nu|xi|pi|rho|sigma|tau|upsilon|phi|psi|omega|Gamma|Delta|Theta|Lambda|Xi|Pi|Sigma|Upsilon|Phi|Psi|Omega)>)([a-zA-Z0-9])/$1 $3/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    28
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    29
    s/([a-zA-Z][a-zA-Z0-9]*)(\\<(alpha|beta|gamma|delta|epsilon|zeta|eta|theta|iota|kappa|mu|nu|xi|pi|rho|sigma|tau|upsilon|phi|psi|omega|Gamma|Delta|Theta|Lambda|Xi|Pi|Sigma|Upsilon|Phi|Psi|Omega)>)/$1 $2/sg;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    30
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    31
    $result = $_;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    32
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    33
    if ($text ne $result) {
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    34
	print STDERR "fixing $file\n";
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    35
        if (! -f "$file~~") {
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    36
	    rename $file, "$file~~" || die $!;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    37
        }
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    38
	open (FILE, "> $file") || die $!;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    39
	print FILE $result;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    40
	close FILE || die $!;
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    41
    }
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    42
}
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    43
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    44
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    45
## main
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    46
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    47
foreach $file (@ARGV) {
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    48
  eval { &fixgreek($file); };
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    49
  if ($@) { print STDERR "*** fixgreek $file: ", $@, "\n"; }
0cab06e3bbd0 Extended the notion of letter and digit, such that now one may use greek,
skalberg
parents:
diff changeset
    50
}