sorting file according to a unicode column

Discussion in 'Perl Misc' started by ehabaziz2001@gmail.com, May 28, 2014.

  1. Guest

    Dear All,
    I need to use that below script but with no success . Even I try to use the ucsort script but also with no success . Any help
    The files columns separated with '|' and the column position 9 with length 200.

    # Cuts fixed substrings out of every line read from DATA, collects them as
    # rows in @File, and prints the rows to STDOUT in sorted order.
    # NOTE(review): the `encoding` pragma is reported as deprecated in modern
    # Perl releases -- confirm against the perl version in use.
    use encoding 'utf8';
    my @File;
    # Maps a start offset to a length; both are handed straight to substr() on
    # the whole line below, so 9 is an offset into the line, not the index of a
    # '|'-separated column.
    my %Positions_and_lenghts = (
    9 => 180 ,
    );



    #For external file
    # FILE is opened for writing here, but nothing in this script prints to it.
    open FILE, '>:utf8', 'F:\programs\sedawk\xerox_scripts\AlexBank\logs\all_cycle_data.sorted' or die "$^E\n";
    binmode STDOUT, ':utf8';


    # Input comes from the DATA handle; no __DATA__ section is visible in this
    # script, so presumably nothing is read -- TODO confirm.
    while (my $line = <DATA>) {
    my $row;
    # One substring per configured position, in ascending position order.
    foreach my $POS (sort {$a<=>$b} keys %Positions_and_lenghts) {
    push @{$row}, substr $line, $POS, $Positions_and_lenghts{$POS}
    }
    push @File, $row


    }


    #use Data::Dumper; print Dumper(\@File);exit;

    # Rows hold one element per configured position (only one here), so the
    # secondary key $a->[2] / $b->[2] is never populated.
    foreach my $row (sort {$a->[0] cmp $b->[0] || $a->[2] cmp $b->[2]} @File) {
    print "@{$row}\n"



    }
    , May 28, 2014
    #1
    1. Advertising

  2. # just works

    # Split every DATA record on '|' (keeping trailing empty fields) and print
    # the records ordered by their tenth field (index 9), compared as strings.
    my @lines;
    while (my $record = <DATA>) {
        chomp $record;
        my @fields = split /\|/, $record, -1;
        push @lines, \@fields;
    }

    for my $fields (sort { $a->[9] cmp $b->[9] } @lines) {
        print "@{$fields}\n";
    }


    __DATA__
    ||||||||one|γ|3
    ||||||||two|α|2
    ||||||||six|β|1
    George Mpouras, May 28, 2014
    #2
    1. Advertising

  3. Guest

    Here it is the whole program after your modifications :
    -------------------------------------------------------

    # Attempted merge of the substr-based script with the split-based one.
    # NOTE(review): as written this does not compile -- see the notes on the
    # leftover lines and the unmatched closing brace below.
    use encoding 'utf8';
    my @File;
    # Still declared, but only referenced by the leftover push line further down.
    my %Positions_and_lenghts = (
    9 => 200 ,
    );



    #For external file
    # FILE is opened for writing here, but nothing in this script prints to it.
    open FILE, '>:utf8', 'F:\programs\sedawk\xerox_scripts\AlexBank\logs\all_cycle_data.sorted' or die "$^E\n";
    binmode STDOUT, ':utf8';


    # The outer loop takes one line from DATA into $line ...
    while (my $line = <DATA>) {

    my @lines;
    # ... and this inner loop then reads all remaining lines from the same handle.
    while (<DATA>) {chomp; push @lines, [split /\|/, $_,-1]}

    # Prints the split records ordered by their tenth field (index 9).
    foreach(sort { $a->[9] cmp $b->[9] } @lines) {print "@{$_}\n"}
    # Leftover from the first script: $row and $POS are never declared here.
    push @{$row}, substr $line, $POS, $Positions_and_lenghts{$POS}
    }
    # Leftover from the first script: runs after the loop, $row is still undeclared.
    push @File, $row


    # This closing brace has no matching opening brace.
    }

    Here is a sample of my long line (Required sorted field is fld2 pos9,length200):
    ------------------------------------------------------------------------------
    514|- شركه مانتراك | 20206105400|0 |0 |0 |سعد زغلول |CORPORATEحساب جاري |YTMPW-bEUcE5a.RPT |EGYPT ALEXANDRIA ALEXANDRIA â€â€ â€Ø§Ù„كيلو28 العامريه الاسكندريه
    , May 31, 2014
    #3
  4. If you are on a proper installed linux system and your files are already
    valid utf8, then you do not need the definitions
    # open FILE, '>:utf8',
    # binmode STDOUT, ':utf8';
    based on the sample line, the following code will do the job






    #!/usr/bin/perl
    # Sort the lines of a '|'-separated file by a slice of one of its columns.
    # Every line is split on '|'; the part of the chosen column between
    # $offset_start (inclusive) and $offset_end (exclusive) is the sort key.
    # Whole lines are printed to STDOUT in ascending string (cmp) order of
    # that key.
    use strict;
    use warnings;

    my $column       = 9;   # use this column for sorting (count from 0)
    my $offset_start = 29;  # important position of the column start (count from 0)
    my $offset_end   = 60;  # important position of the column end (count from 0)
    my $input_file   = '/tmp/file1.txt';
    my @lines;

    open my $in, '<', $input_file or die "oh no ! \"$!\"\n";

    while (my $line = <$in>) {
        chomp $line;

        # A line with too few columns has no such field: use an empty one
        # rather than carrying undef into length/substr.
        my $field = (split /\|/, $line, -1)[$column];
        $field = '' unless defined $field;

        # substr() already stops at the end of the string, so no manual
        # clamping of the end offset is needed. It only misbehaves (undef plus
        # a warning) when the start lies beyond the end, hence the guard.
        my $order_by = '';
        if (length($field) > $offset_start) {
            $order_by = substr $field, $offset_start, $offset_end - $offset_start;
        }

        push @lines, [ $order_by, $line ];
    }

    close $in;

    # use Data::Dumper; print Dumper \@lines;

    foreach my $entry (sort { $a->[0] cmp $b->[0] } @lines) {
        print "$entry->[1]\n";
    }
    George Mpouras, Jun 2, 2014
    #4
  5. There was a typo in the code; here is the corrected version:


    #!/usr/bin/perl
    # Sort the lines of a '|'-separated file by a slice of one of its columns.
    # Every line is split on '|'; the part of the chosen column between
    # $offset_start (inclusive) and $offset_end (exclusive) is the sort key.
    # Whole lines are printed to STDOUT in ascending string (cmp) order of
    # that key.
    use strict;
    use warnings;

    # http://unicode.org/charts/PDF/U0600.pdf

    # 1,3 29

    my $column       = 8;  # use this column for sorting (count from 0)
    my $offset_start = 1;  # important position of the column start (count from 0)
    my $offset_end   = 3;  # important position of the column end (count from 0)
    my $input_file   = '/tmp/file1.txt';
    my @lines;

    open my $in, '<', $input_file or die "oh no ! \"$!\"\n";

    while (my $line = <$in>) {
        chomp $line;

        # Lines with fewer columns than expected contribute an empty field.
        my $field = (split /\|/, $line, -1)[$column];
        $field = '' unless defined $field;

        # Clamp the end of the slice to the field length, and fall back to an
        # empty key when the field is too short to reach $offset_start
        # (substr would otherwise warn and return undef).
        my $Length = length $field;
        my $offend = $offset_end > $Length ? $Length : $offset_end;
        my $order_by = $Length > $offset_start
            ? substr($field, $offset_start, $offend - $offset_start)
            : '';

        push @lines, [ $order_by, $line ];
    }

    close $in;

    # use Data::Dumper; print Dumper \@lines;

    foreach my $entry (sort { $a->[0] cmp $b->[0] } @lines) {
        print "$entry->[1]\n";
    }
    George Mpouras, Jun 2, 2014
    #5
  6. #!/usr/bin/perl
    # Sort the lines of a '|'-separated file by a slice of one of its columns
    # and print the whole lines to STDOUT in ascending string (cmp) order of
    # that slice.
    use strict;
    use warnings;

    my $column       = 9;   # use this column for sorting (count from 0)
    my $offset_start = 29;  # important position of the column start (count from 0)
    my $offset_end   = 50;  # important position of the column end (count from 0)
    my $input_file   = '/tmp/file1.txt';
    my @lines;

    open my $in, '<', $input_file or die "oh no ! \"$!\"\n";

    while (my $line = <$in>) {
        chomp $line;
        push @lines, [ sort_key($line), $line ];
    }

    close $in;

    foreach my $entry (sort { $a->[0] cmp $b->[0] } @lines) {
        print "$entry->[1]\n";
    }

    # Return the characters of column $column that lie in the range
    # [$offset_start, $offset_end), or '' when the line has no such column or
    # the column is too short to reach $offset_start.
    sub sort_key {
        my ($line) = @_;

        my $field = (split /\|/, $line, -1)[$column];
        return '' unless defined $field;
        return '' unless length($field) > $offset_start;

        # substr() stops at the end of the string on its own, so the end
        # offset needs no manual clamping.
        return substr $field, $offset_start, $offset_end - $offset_start;
    }
    George Mpouras, Jun 2, 2014
    #6
  7. Guest

    I am running perl under XP dos box.
    ------------------------------------
    I got that errors after running :
    F:\COMPILER\Perl\bin\perl sorting.pl 1.log

    Here is my script:
    -----------------

    use strict;
    use warnings;
    # Builds [sort key, whole line] pairs from a '|'-separated log file. See the notes on the stray "from 0)" lines.
    my $column = 2; # use this column for sorting
    my $offset_start = 9; # important position of the column start (count
    from 0) # NOTE: wrapped tail of the comment above; on its own line it is parsed as code, not as a comment
    my $offset_end = 209; # important position of the column end (count
    from 0) # NOTE: same problem; it belongs at the end of the '#' comment on the previous line
    my @lines;
    # The input path is hard-coded; this script never reads @ARGV.
    open FILE, '<', 'F:\programs\sedawk\xerox_scripts\AlexBank\scripts\1.log' or die "oh no ! \"$!\"\n";
    # For each line: take column $column, clamp the end offset to its length, keep the slice as the key.
    while (<FILE>) {
    chomp;
    my $order_by = (split /\|/, $_, -1)[$column];
    my $Length = length $order_by;
    my $offend = $offset_end > $Length ? $Length : $offset_end;
    $order_by = substr $order_by, $offset_start, ($offend-$offset_start);
    push @lines, [$order_by, $_]
    }
    # NOTE: the script ends after the close below; @lines is never sorted or printed, so it emits no output.
    close FILE;

    The error :
    -----------
    Number found where operator expected at sorting.pl line 6, near "from 0"
    (Do you need to predeclare from?)
    Number found where operator expected at sorting.pl line 8, near "from 0"
    (Do you need to predeclare from?)
    syntax error at sorting.pl line 6, near "from 0"
    Can't use global $! in "my" at sorting.pl line 11, near "oh no ! "$!"
    Execution of sorting.pl aborted due to compilation errors.
    F:\programs\sedawk\xerox_scripts\AlexBank\scripts>
    , Jun 2, 2014
    #7
  8. Guest

    Please help: I do not see any output when I run the command below:
    F:\COMPILER\Perl\bin\perl sorting.pl 1.log


    On Wednesday, May 28, 2014 4:22:10 PM UTC+2, wrote:
    > Dear All,
    >
    > I need to use that below script but with no success . Even I try to use the ucsort script but also with no success . Any help
    >
    > The files columns separated with '|' and the column position 9 with length 200.
    >
    >
    >
    > use encoding 'utf8';
    >
    > my @File;
    >
    > my %Positions_and_lenghts = (
    >
    > 9 => 180 ,
    >
    > );
    >
    >
    >
    >
    >
    >
    >
    > #For external file
    >
    > open FILE, '>:utf8', 'F:\programs\sedawk\xerox_scripts\AlexBank\logs\all_cycle_data.sorted' or die "$^E\n";
    >
    > binmode STDOUT, ':utf8';
    >
    >
    >
    >
    >
    > while (my $line = <DATA>) {
    >
    > my $row;
    >
    > foreach my $POS (sort {$a<=>$b} keys %Positions_and_lenghts) {
    >
    > push @{$row}, substr $line, $POS, $Positions_and_lenghts{$POS}
    >
    > }
    >
    > push @File, $row
    >
    >
    >
    >
    >
    > }
    >
    >
    >
    >
    >
    > #use Data::Dumper; print Dumper(\@File);exit;
    >
    >
    >
    > foreach my $row (sort {$a->[0] cmp $b->[0] || $a->[2] cmp $b->[2]} @File) {
    >
    > print "@{$row}\n"
    >
    >
    >
    >
    >
    >
    >
    > }
    , Jun 2, 2014
    #8
  9. writes:
    > I am running perl under XP dos box.
    > ------------------------------------
    > I got that errors after running :
    > F:\COMPILER\Perl\bin\perl sorting.pl 1.log


    [...]

    > my $offset_start = 9; # importand position of the column start (count
    > from 0)


    > my $offset_end = 209; # importand position of the column end (count
    > from 0)


    The 'from 0)' belongs to the comment started the respective lines
    above. It must not appear alone on a line, as it does here.
    Rainer Weikusat, Jun 2, 2014
    #9
  10. Guest

    How can I eecute it under dos . Is like this ?

    F:\COMPILER\Perl\bin\perl sorting.pl input_file.log



    بتاريخ الاثنين، 2 يونيو، 2014 UTC+2 9:13:37 م، كتب Rainer Weikusat:
    > writes:
    >
    > > I am running perl under XP dos box.

    >
    > > ------------------------------------

    >
    > > I got that errors after running :

    >
    > > F:\COMPILER\Perl\bin\perl sorting.pl 1.log

    >
    >
    >
    > [...]
    >
    >
    >
    > > my $offset_start = 9; # importand position of the column start (count

    >
    > > from 0)

    >
    >
    >
    > > my $offset_end = 209; # importand position of the column end (count

    >
    > > from 0)

    >
    >
    >
    > The 'from 0)' belongs to the comment started the respective lines
    >
    > above. It must not appear alone on a line, as it does here.
    , Jun 3, 2014
    #10
  11. Στις 3/6/2014 11:57, ο/η έγραψε:
    > How can I eecute it under dos . Is like this ?
    >
    > F:\COMPILER\Perl\bin\perl sorting.pl input_file.log
    >
    >
    >
    > بتاريخ الاثنين، 2 يونيو، 2014 UTC+2 9:13:37 م، كتب Rainer Weikusat:
    >> writes:
    >>
    >>> I am running perl under XP dos box.

    >>
    >>> ------------------------------------

    >>
    >>> I got that errors after running :

    >>
    >>> F:\COMPILER\Perl\bin\perl sorting.pl 1.log






    On Windows, use Notepad++ to create a script, say test.pl, and put the Perl
    code in it. Then all you have to do is execute

    test.pl inputdata.txt outputsorted.txt

    Copy and paste the following lines into test.pl:
    ################################################################################






    use strict;
    use warnings;

    # Usage: test.pl INPUT_FILE OUTPUT_FILE
    #
    # Sorts the lines of INPUT_FILE by a slice of one '|'-separated column and
    # writes the whole lines to OUTPUT_FILE in ascending string (cmp) order of
    # that slice. Both files are opened with the :utf8 layer, so the offsets
    # below apply to decoded characters.

    # Check the command line in a fixed order so the first problem found is
    # the one reported.
    @ARGV >= 1  or die "You did not define the input file\n";
    -f $ARGV[0] or die "The input file does not exist\n";
    @ARGV >= 2  or die "You did not define any output file\n";
    my ($file_input, $file_output) = @ARGV;

    my $column       = 9;   # use this column for sorting (count from 0)
    my $offset_start = 29;  # important position of the column start (count from 0)
    my $offset_end   = 50;  # important position of the column end (count from 0)
    my @lines;

    open my $in, '<:utf8', $file_input or die "Fatal error \"$!\"\n";
    while (my $line = <$in>) {
        chomp $line;

        # Lines with fewer columns than expected contribute an empty field.
        my $field = (split /\|/, $line, -1)[$column];
        $field = '' unless defined $field;

        # substr() stops at the end of the string by itself; it only warns and
        # returns undef when the start is beyond the end, so guard that case.
        my $order_by = length($field) > $offset_start
            ? substr($field, $offset_start, $offset_end - $offset_start)
            : '';

        push @lines, [ $order_by, $line ];
    }
    close $in;

    open my $out, '>:utf8', $file_output or die "Fatal error \"$!\"\n";
    foreach my $entry (sort { $a->[0] cmp $b->[0] } @lines) {
        print {$out} "$entry->[1]\n";
    }
    # Buffered write errors only surface when the handle is closed.
    close $out or die "Fatal error \"$!\"\n";
    George Mpouras, Jun 3, 2014
    #11
  12. On 2014-06-02 11:01, George Mpouras <> wrote:
    > If you are on a proper installed linux system and your files are already
    > valid utf8, then you do not need the definitions
    > # open FILE, '>:utf8',
    > # binmode STDOUT, ':utf8';


    Yes, you do, if you want a definition of offset meaningful for a user.

    Consider this file:

    ---------------
    Grüß Gott  de_at
    Καλημέρα   gr
    こんにちは      jp
    ---------------

    The first column is 11 characters wide, the second takes the rest, and
    you want to sort by the second column. So you get the key with

    my $key = substr($_, 11);

    right?

    But the German umlauts and Greek characters are each 2 bytes in utf-8
    and the Japanese characters are 3 bytes. So what's the correct offset
    for each line? You can't tell a priori, because it depends on the
    specific characters in the first column. But if you decode the UTF-8
    first, it's just 11 characters and you don't have to worry about how
    many bytes it is.

    So, this produces the correct output:

    #!/usr/bin/perl
    # Demo: sort the lines of the file named in $ARGV[0] by everything after
    # the first 11 characters, then print each line followed by its key in
    # square brackets.

    use warnings;
    use strict;
    use autodie;

    # The same I/O layer is applied to the input file and to STDOUT. Swap in
    # the commented-out empty layer to see the effect of not decoding.
    my $enc = ':encoding(UTF-8)';
    #my $enc = '';
    open(my $in_fh, "<$enc", $ARGV[0]);
    binmode(STDOUT, $enc);

    # Each entry is a [key, whole line] pair.
    my @lines;
    while (my $line = <$in_fh>) {
        chomp $line;
        push @lines, [ substr($line, 11), $line ];
    }

    for my $pair (sort { $a->[0] cmp $b->[0] } @lines) {
        print "$pair->[1] [$pair->[0]]\n";
    }

    But if you use the empty $enc, it produces garbage.

    Of course in reality it is more complicated.

    Japanese and Chinese characters are often displayed at double width,
    so if I had edited my file to make the columns match up nicely in my
    editor, the last line would have needed an offset of 6 instead of 11.
    And for many characters there is a composed and a decomposed form: "ü"
    could be <LATIN SMALL LETTER U WITH DIAERESIS> or <LATIN SMALL LETTER U>
    + <COMBINING DIAERESIS>. The latter of course counts as two characters
    for substr.

    Management summary: Avoid character offsets in file formats.

    hp

    --
    _ | Peter J. Holzer | Fluch der elektronischen Textverarbeitung:
    |_|_) | | Man feilt solange an seinen Text um, bis
    | | | | die Satzbestandteile des Satzes nicht mehr
    __/ | http://www.hjp.at/ | zusammenpaßt. -- Ralph Babel
    Peter J. Holzer, Jun 5, 2014
    #12
  13. Guest

    I have executed your script successfully, but I want to change the sorting column to the name column (length 200 characters). It is the second column, starting at position 9 and ending at position 209. How are columns indexed in Perl? Is the first column numbered 0 or 1?
    my $column = 1; # use this column for sorting
    my $offset_start= 9; # importand position of the column start (count from0)
    my $offset_end = 209; # importand position of the column end (count from 0)

    my file :

    923|يونس عبداللطي٠يونس الحنÙÙ‰ | 31701246200|0 |0 |0 |سمنود |حساب المصــرى |CTMP_RalicE5a.RPT |مصر الدقهلية اجا â€â€ â€Ø§Ù„دير - Ù… اجا



    بتاريخ الأربعاء، 28 مايو، 2014 UTC+2 4:22:10 م، كتب :
    > Dear All,
    >
    > I need to use that below script but with no success . Even I try to use the ucsort script but also with no success . Any help
    >
    > The files columns separated with '|' and the column position 9 with length 200.
    >
    >
    >
    > use encoding 'utf8';
    >
    > my @File;
    >
    > my %Positions_and_lenghts = (
    >
    > 9 => 180 ,
    >
    > );
    >
    >
    >
    >
    >
    >
    >
    > #For external file
    >
    > open FILE, '>:utf8', 'F:\programs\sedawk\xerox_scripts\AlexBank\logs\all_cycle_data.sorted' or die "$^E\n";
    >
    > binmode STDOUT, ':utf8';
    >
    >
    >
    >
    >
    > while (my $line = <DATA>) {
    >
    > my $row;
    >
    > foreach my $POS (sort {$a<=>$b} keys %Positions_and_lenghts) {
    >
    > push @{$row}, substr $line, $POS, $Positions_and_lenghts{$POS}
    >
    > }
    >
    > push @File, $row
    >
    >
    >
    >
    >
    > }
    >
    >
    >
    >
    >
    > #use Data::Dumper; print Dumper(\@File);exit;
    >
    >
    >
    > foreach my $row (sort {$a->[0] cmp $b->[0] || $a->[2] cmp $b->[2]} @File){
    >
    > print "@{$row}\n"
    >
    >
    >
    >
    >
    >
    >
    > }
    , Jun 11, 2014
    #13
  14. Guest

    I also got these errors, and I noticed that no English names appear in the sorted output file:

    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 201.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 632.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1108.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1165.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1166.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1167.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1466.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1467.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1494.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1672.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 1870.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 1887.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 2026.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 2027.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 2108.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 2301.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 2890.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3217.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3218.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3478.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3503.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3504.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3606.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 3835.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3865.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3866.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3867.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3868.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3869.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3870.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3871.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3872.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3873.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3874.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3875.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3876.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3877.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3878.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3879.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3880.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3881.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 3882.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 4196.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 4641.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 4642.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 4860.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 4861.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 5278.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 5279.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 5529.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 5530.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 5531.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 7804.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 8437.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 8438.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 8439.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 8507.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 8508.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9524.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9525.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9526.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9527.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9528.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 9529.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 9799.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 10201.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 10246.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 10252.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 10253.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 10254.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 10672.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 10673.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 11838.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 12370.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 12634.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 12655.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 12656.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 12701.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 12834.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 13587.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 13588.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 14219.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 14220.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 14839.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 14842.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16218.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 16247.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 16371.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16634.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16635.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 16951.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 16952.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16972.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16973.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 16974.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 17072.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 17077.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 17078.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 17276.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 17693.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18160.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18183.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18184.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18202.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 18566.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18623.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18643.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 18644.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 19259.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 19360.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 19727.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 19731.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 19871.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 19942.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 19986.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 20055.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 20056.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 20057.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20074.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20113.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20147.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20220.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20626.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20804.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 20873.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 20927.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 20980.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21051.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21052.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21335.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21336.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21527.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21528.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 21833.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 21856.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 21857.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 22110.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 22174.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 22350.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 22430.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 22651.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 22845.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 22888.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 22960.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 23146.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 23215.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 23282.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 23283.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 24010.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 24011.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24526.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24527.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24845.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24846.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24847.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24908.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24915.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 24971.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 25073.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 25466.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 25598.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 25617.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 25618.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 25874.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 26495.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 26548.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 26668.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 26877.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 26960.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 26984.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 27105.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27120.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27262.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27306.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27383.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27555.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27556.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 27557.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 27661.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 27793.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 27794.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 28287.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 28288.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 28289.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 28982.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 30768.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31052.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31053.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31061.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31233.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31322.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31323.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 31427.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31450.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31451.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31452.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 31453.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 31789.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 31790.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 31791.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 32058.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 32165.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 32404.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 32641.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 32642.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 32910.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 33253.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 33300.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 33663.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 33741.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 33742.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34034.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34035.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34097.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34098.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34099.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34100.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34101.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34102.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34103.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 34151.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34161.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34162.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34246.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34267.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34268.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34457.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34553.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 34676.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 34756.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35091.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35092.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 35098.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 35099.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 35100.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35104.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35105.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35160.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 35447.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 35604.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36021.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36133.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36486.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36738.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36739.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 36912.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 37088.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 37743.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 37822.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38148.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38197.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38198.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38199.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38626.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38831.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38832.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38915.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 38916.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 39329.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 39373.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 39797.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 40877.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 40972.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 40973.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 41165.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 41166.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 41690.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 41691.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 41694.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 41877.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42122.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42126.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42495.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 42584.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 42585.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42618.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42619.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42750.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42835.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 42836.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 42851.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 42852.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 43022.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 43115.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 43402.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 43403.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 43428.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 43736.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 43754.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 43836.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 44032.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 44088.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 44089.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 44090.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 44224.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 44258.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 45016.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 45122.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 45126.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 45266.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 45376.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 45377.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 45378.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 45425.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 45845.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 46007.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46015.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46085.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46513.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46929.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46930.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46978.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 46979.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 47056.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 47057.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 47328.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 47329.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 47912.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 48001.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48623.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48634.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48635.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48674.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48679.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48772.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 48773.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49240.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49308.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49465.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49466.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49516.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49517.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49519.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49520.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49521.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 49525.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49638.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49639.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 49680.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 50119.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 50120.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 50231.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 50232.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 50250.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 50251.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 50582.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 50659.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 50835.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51057.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51109.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51270.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51291.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51417.
    Malformed UTF-8 character (unexpected end of string) in split at sorting.pl line 25, <IN> line 51417.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51489.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51519.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51520.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51521.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51711.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51759.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 51760.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51781.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 51862.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 52184.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 52292.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 52406.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 52407.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 52836.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53026.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53027.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53235.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 53477.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53493.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53549.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 53612.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53698.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 53699.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 53742.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 53770.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 53771.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 54024.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 54025.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 54128.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 54166.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 54242.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 54828.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 54859.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 54860.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 54870.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 54964.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 55108.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 55138.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 55497.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 55498.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 55970.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56032.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56095.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56096.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56100.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56122.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56129.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56280.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56286.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56424.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56425.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56739.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 56826.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56907.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56908.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56937.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56938.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 56973.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 57037.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 57038.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 57264.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 57626.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57664.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57665.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 57678.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57706.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57707.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57851.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57852.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57853.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 57854.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 58104.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 58513.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 58514.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 58694.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 58903.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 58958.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 58959.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59323.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59374.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59375.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59403.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 59615.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 59691.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 59706.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 59775.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 59776.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59783.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 59963.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 60070.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 60071.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 60154.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 60306.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 60725.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 60795.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 60840.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 61154.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 61511.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 61512.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 61940.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 62008.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62485.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 62709.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 62710.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 62913.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62918.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62927.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62928.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62929.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 62930.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63119.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 63147.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63194.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63195.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63613.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63614.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 63781.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 63849.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64026.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64027.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64409.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64620.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64709.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 64838.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64843.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 64873.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65006.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65104.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65105.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65152.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65206.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65236.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65401.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65402.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65403.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65424.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65574.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65575.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65576.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65577.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 65592.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 65737.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 66403.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 66580.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 66621.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 66980.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 67040.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 67226.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 67236.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 67843.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 67844.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 68019.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 68276.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 68568.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 68970.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 69025.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 69077.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69200.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69201.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69245.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69363.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69662.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69735.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69736.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69737.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 69827.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 70251.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 70252.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 70269.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70358.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70359.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70473.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70492.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70611.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70612.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 70700.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71118.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71235.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71236.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71393.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71394.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 71407.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 71677.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 71678.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 71831.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 71908.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 71933.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72039.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 72055.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72251.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72252.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72481.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72482.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 72756.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 72825.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 72873.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 72874.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 73551.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 73640.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 73764.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 73765.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 73820.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74039.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74052.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74053.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74186.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74187.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74311.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74317.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74318.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 74526.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74661.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74662.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 74888.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 75074.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 75075.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 75109.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 75110.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 75217.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 75218.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 75551.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 76285.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 76286.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 76463.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 76488.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 76489.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 76493.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 76494.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77240.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77241.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 77291.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77319.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77320.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77356.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77357.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77617.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77618.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 77718.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77725.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 77726.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 77751.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 77752.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 78251.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 78382.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 78672.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 79076.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80188.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80297.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80664.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80665.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 80678.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80691.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 80862.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80879.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 80884.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 81031.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 81032.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 81077.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81225.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 81663.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 81664.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81675.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81676.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81894.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81895.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81919.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81953.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 81960.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82250.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 82439.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 82440.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82762.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82763.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82764.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82841.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82842.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82843.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82844.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82886.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82887.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82960.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 82963.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 83079.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 83080.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 83081.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 84358.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 84557.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 84925.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 84926.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 85433.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 85592.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 85861.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86428.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 86467.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86495.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86496.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86776.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86840.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 86841.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 86878.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 86879.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87275.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87276.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87288.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87303.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87304.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 87411.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 87643.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 87644.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 87764.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 88178.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 88181.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88266.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 88450.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88687.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88868.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88869.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88870.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88954.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 88955.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89020.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 89691.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 89692.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 89693.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89850.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89851.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89852.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89883.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 89943.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90002.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 90122.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 90164.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 90264.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90269.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90595.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90596.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 90683.
    utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 90684.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90838.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90896.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90897.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90898.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90899.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90900.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 90922.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 91087.
    utf8 "\xD9" does not map to Unicode at sorting.pl line 29, <IN> line 91088.
    utf8 "\xE2" does not map to Unicode at sorting.pl line 29, <IN> line 91423.



    بتاريخ الأربعاء، 4 يونيو، 2014 UTC+2 12:17:37 ص، كتب George Mpouras:
    > Στις 3/6/2014 11:57, ο/η ehabaziz2001@gmail..com έγραψε:
    >
    > > How can I execute it under DOS? Is it like this?

    >
    > >

    >
    > > F:\COMPILER\Perl\bin\perl sorting.pl input_file.log

    >
    > >

    >
    > >

    >
    > >

    >
    > > بتاريخ الاثنين، 2 يونيو، 2014 UTC+2 9:13:37 م، كتب Rainer Weikusat:

    >
    > >> writes:

    >
    > >>

    >
    > >>> I am running perl under XP dos box.

    >
    > >>

    >
    > >>> ------------------------------------

    >
    > >>

    >
    > >>> I got that errors after running :

    >
    > >>

    >
    > >>> F:\COMPILER\Perl\bin\perl sorting.pl 1.log

    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    > On Windows, using Notepad++, create a script, let's say test.pl, and write the
    >
    > Perl code there. Then all you have to do is execute
    >
    >
    >
    > test.pl inputdata.txt outputsorted.txt
    >
    >
    >
    > copy/paste the following lines at test.pl
    >
    > ################################################################################
    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    >
    > use strict;
    >
    > use warnings;
    >
    >
    >
    > my $file_input = exists $ARGV[0] ? (-f $ARGV[0] ? $ARGV[0]: die "The input file does not
    >
    > exist\n") : die "You did not define the input file\n";
    >
    > my $file_output = exists $ARGV[1] ? $ARGV[1] : die "You did not define any output file\n";
    >
    > my $column = 9; # use this column for sorting
    >
    > my $offset_start= 29; # importand position of the column start (count from 0)
    >
    > my $offset_end = 50; # importand position of the column end (count from 0)
    >
    > my @lines;
    >
    >
    >
    > open IN, '<:utf8', $file_input or die "Fatal error \"$!\"\n";
    >
    > while (<IN>) {
    >
    > chomp;
    >
    > my $order_by = (split /\|/, $_, -1)[$column];
    >
    > my $Length = length $order_by;
    >
    > my $offend = $offset_end > $Length ? $Length : $offset_end;
    >
    > $order_by = substr $order_by, $offset_start, ($offend-$offset_start);
    >
    > push @lines, [$order_by, $_]
    >
    > }
    >
    > close IN;
    >
    >
    >
    > open OUT, '>:utf8', $file_output or die "Fatal error \"$!\"\n";
    >
    > foreach (sort { $a->[0] cmp $b->[0] } @lines) {
    >
    > print OUT "$_->[1]\n"
    >
    > }
    >
    > close OUT;
    , Jun 11, 2014
    #14
  15. Στις 11/6/2014 2:18 μμ, ο/η έγραψε:
    > I also got these errors and noticed that no English names were found in the sorted result file:
    >
    > utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 201.
    > utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 632.



    I suspect that your input files are not valid utf8 ...
    George Mpouras, Jun 11, 2014
    #15
  16. Στις 11/6/2014 10:34 μμ, ο/η George Mpouras έγραψε:
    > Στις 11/6/2014 2:18 μμ, ο/η έγραψε:
    >> I also got these errors and noticed that no English names were found in the sorted
    >> result file:
    >>
    >> utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 201.
    >> utf8 "\xD8" does not map to Unicode at sorting.pl line 29, <IN> line 632.

    >
    >
    > I suspect that your input files are not valid utf8 ...
    >


    Because I admire your patience (!) in this thread: if it is not
    something super secret, compress one of these files and send it to my
    email (change the "foo" suffix to "com").

    G.Mpouras
    George Mpouras, Jun 11, 2014
    #16
  17. Guest

    I am sorry, I cannot find your email. Mine is:
    , Jun 14, 2014
    #17
  18. Στις 14/6/2014 11:11 μμ, ο/η έγραψε:
    > I am sorry, I cannot find your email. Mine is:
    >

    use this one

    perl -e "print pack 'h*', '76271667964716c63757e60486f647d61696c6e236f6d6'"
    George Mpouras, Jun 15, 2014
    #18
    1. Advertising

Want to reply to this thread or ask your own question?

It takes just 2 minutes to sign up (and it's free!). Just click the sign up button to choose a username and then you can ask your own questions on the forum.
Similar Threads
  1. Replies:
    5
    Views:
    8,274
    Andy Dingley
    May 7, 2005
  2. W. Van Hooste

    FILE undeclared - but its not, according to me.

    W. Van Hooste, Sep 16, 2003, in forum: C Programming
    Replies:
    9
    Views:
    4,950
    Dave Thompson
    Sep 22, 2003
  3. cesco
    Replies:
    5
    Views:
    369
    Maxim Yegorushkin
    Feb 10, 2006
  4. CMOS
    Replies:
    1
    Views:
    312
    Jack Klein
    Aug 29, 2006
  5. Poor Yorick
    Replies:
    0
    Views:
    451
    Poor Yorick
    Dec 3, 2008
Loading...

Share This Page