/usr/share/doc/libtext-csv-xs-perl/examples/parser-xs.pl is in libtext-csv-xs-perl 1.11-2.
This file is owned by root:root, with mode 0o755.
The actual contents of the file can be viewed below.
#!/usr/bin/perl
# This script can be used as a base to parse unreliable CSV streams
# Modify to your own needs
#
# (m)'08 [23 Apr 2008] Copyright H.M.Brand 2008-2014
use strict;
use warnings;
use Text::CSV_XS;
# Strict parser: used for the first attempt on every record and for
# writing the accepted rows to STDOUT (eol makes print () end each row
# with the current input record separator).
my $csv = Text::CSV_XS->new ({
    binary         => 1,
    blank_is_undef => 1,
    eol            => $/,
    });

# Lenient ("allow mode") parser: used to re-parse input the strict parser
# rejected. Loose quotes are accepted and no escape character is active.
my $csa = Text::CSV_XS->new ({
    binary             => 1,
    allow_loose_quotes => 1,
    blank_is_undef     => 1,
    escape_char        => undef,
    });

# Input file: first command line argument, defaulting to "test.csv"
my $file = @ARGV ? shift : "test.csv";
open my $fh, "<", $file or die "$file: $!\n";

# Error codes that mean a \r or \n was found inside a field, in which case
# the record may continue on the next physical line. In the Text::CSV_XS
# diagnostics these are 2010 (ECR), 2027 (EIQ), 2031 and 2032 (EIF).
my %err_eol = map { $_ => 1 } 2010, 2027, 2031, 2032;

print STDERR "Reading $file with Text::CSV_XS $Text::CSV_XS::VERSION\n";

# Return an excerpt of at most 12 characters of $input around the 1-based
# position $pos, with the offending character marked between two '*'.
# The position is clamped to the text, so an error near the start of the
# line no longer yields a negative substr offset (which would silently
# select text from the END of the line), and an out-of-range position
# cannot trigger a fatal "substr outside of string".
sub _error_excerpt {
    my ($input, $pos) = @_;

    # The trailing space guarantees there is a character to mark when the
    # error is reported just past the end of the scanned input
    my $text = (defined $input ? $input : "") . " ";

    my $at = ($pos || 1) - 1;           # $pos is 1-based
    $at < 0                  and $at = 0;
    $at > length ($text) - 1 and $at = length ($text) - 1;

    # Insert the closing marker first so $at stays valid for the opening one
    substr $text, $at + 1, 0, "*";
    substr $text, $at,     0, "*";

    my $from = $at - 5;                 # Show up to 5 characters of context
    $from < 0 and $from = 0;

    (my $excerpt = substr $text, $from, 12) =~ s/ +$//;
    return $excerpt;
    }

# Main loop: read records with the strict parser; on failure, diagnose and
# retry the offending input with the lenient parser.
ROW: while (1) {
    my $row = $csv->getline ($fh);

    unless ($row) {                     # Parsing failed
        # Could be end of file
        $csv->eof and last ROW;

        # Diagnose and show what was wrong
        my @diag = $csv->error_diag;    # (code, message, position, ...)
        print STDERR "$file line $./$diag[2] - $diag[0] - $diag[1]\n";

        my $ein = $csv->error_input;    # The line scanned so far
        my $err = _error_excerpt ($ein, $diag[2]);
        print STDERR " |$err|\n";

        REPARSE: {                      # Now retry with allowed options
            if ($csa->parse ($ein)) {
                print STDERR "Accepted in allow mode ...\n";
                $row = [ $csa->fields ];
                last REPARSE;
                }

            # Still fails
            my @adiag = $csa->error_diag;
            if (exists $err_eol{$adiag[0]}) {   # \r or \n inside field
                # Only extend while there is input left. Without this
                # check an unterminated field at end of file would retry
                # the same unchanged input forever.
                my $chunk = <$fh>;
                if (defined $chunk) {
                    print STDERR " Extending line with next chunk\n";
                    $ein .= $chunk;
                    redo REPARSE;
                    }
                }

            print STDERR " Also could not parse it in allow mode\n";
            print STDERR " $./$adiag[2] - $adiag[0] - $adiag[1]\n";
            print STDERR " Line skipped\n";

            # A bare block counts as a loop, so an unlabeled "next" would
            # merely leave REPARSE and then print an undefined row. The
            # label makes it continue with the next record instead.
            next ROW;
            }
        }

    # Data was fine, print data properly quoted
    $csv->print (*STDOUT, $row);
    }

close $fh;
|