fast_csv 0.1.22 fast_csv: ^0.1.22 copied to clipboard
Classic non-configurable CSV parser suitable for most use cases. Pretty fast parsing.
fast_csv #
Classic non-configurable CSV parser suitable for most use cases. Pretty fast parsing.
Version: 0.1.22
It also serves as an example of creating a parser with parser_builder.
Creating a fast parser is very easy.
The generated parser may be a little slower, a little faster, or perform the same as a handwritten one, but using parser_builder can reduce the time it takes to create it several times over.
Example of the parser usage #
import 'package:fast_csv/fast_csv.dart' as _fast_csv;
/// Parses the sample CSV, prints every parsed row on its own line, and then
/// prints the car name (column 1) and the numeric price (column 4) per row.
void main(List<String> args) {
  final rows = _fast_csv.parse(_csv);
  print(rows.join('\n'));
  for (var i = 0; i < rows.length; i++) {
    final fields = rows[i];
    final car = fields[1];
    // Fields are returned as strings, so the price is converted explicitly.
    final price = num.parse(fields[4]);
    print('$car $price');
  }
}
// Sample comma-separated input for the example above. It exercises quoted
// fields, the `""` escape for a literal quote, an empty quoted field and
// non-ASCII characters (the guillemets in the second row).
const _csv = '''
1997,Ford,E350,"ac, ""abs"", moon",3000.00
1999,Chevy,"Venture «Extended Edition»","",4900.00
1996,Jeep,Grand Cherokee,"MUST SELL! air, moon roof, loaded",4799.00
''';
An example of using a configurable parser #
This parser is slightly slower than the non-configurable parser.
import 'package:fast_csv/fast_csv_ex.dart' as _fast_csv_ex;
/// Parses the semicolon-separated sample with the configurable parser, prints
/// every parsed row on its own line, and then prints the car name (column 1)
/// and the numeric price (column 4) per row.
void main(List<String> args) {
  final rows = _fast_csv_ex.parse(_csv, separator: ';');
  print(rows.join('\n'));
  for (var i = 0; i < rows.length; i++) {
    final fields = rows[i];
    final car = fields[1];
    // The price field is converted explicitly with num.parse.
    final price = num.parse(fields[4]);
    print('$car $price');
  }
}
// Sample input for the configurable-parser example above, using `;` as the
// field separator. It exercises quoted fields containing commas, the `""`
// escape, an empty quoted field and non-ASCII characters (the guillemets).
const _csv = '''
1997;Ford;E350;"ac, ""abs"", moon";3000.00
1999;Chevy;"Venture «Extended Edition»";"";4900.00
1996;Jeep;Grand Cherokee;"MUST SELL! air, moon roof, loaded";4799.00
''';
CSV parser declaration #
tool/build_csv_parser.dart
import 'package:parser_builder/branch.dart';
import 'package:parser_builder/bytes.dart';
import 'package:parser_builder/character.dart';
import 'package:parser_builder/combinator.dart';
import 'package:parser_builder/fast_build.dart';
import 'package:parser_builder/multi.dart';
import 'package:parser_builder/parser_builder.dart';
import 'package:parser_builder/sequence.dart';
import 'package:parser_builder/transformers.dart';
/// Build script entry point: generates `lib/fast_csv.dart` from the `_parse`
/// parser declaration, prefixed with the `__header` text.
void main(List<String> args) async {
  // Size optimization is switched off for the generated code.
  final buildContext = Context()..optimizeForSize = false;
  const outputPath = 'lib/fast_csv.dart';
  await fastBuild(buildContext, [_parse], outputPath, header: __header);
}
// Text passed to `fastBuild` as the `header:` of the generated file.
//
// It is a raw string, so `\n` and `$message` below are written to the output
// verbatim rather than being interpreted here. Besides the "generated code"
// notice and the `source_span` import, it declares the public `parse`
// function, which runs `_parse` on a `State` and throws a `FormatException`
// when `state.ok` is false.
const __header = r'''
// This code was generated by a tool.
// https://github.com/mezoni/parser_builder
// ignore_for_file: unused_local_variable
import 'package:source_span/source_span.dart';
/// Parses the CSV data and returns the result as a `List<List<String>>`.
/// - Will not parse numbers
/// - The character `,` is used as a field separator
/// - Line endings are `\n`, `\r\n` or `\r`
/// - The start and end of strings is the character `"`
/// - Escaping a character `"` in a string is parsed via sequence `""`
/// - Exception `FormatException` will be thrown if parsing fails
List<List<String>> parse(String source) {
final state = State(source);
final result = _parse(state);
if (!state.ok) {
final errors = Err.errorReport(state.error);
final message = _errorMessage(source, errors);
throw FormatException('\n$message');
}
return result!;
}
''';
// Contents of a quoted field: a repetition (`Many0`) of either a character
// other than `"` (0x22) or the escape tag `""`, which is mapped to 0x22.
const _chars = Named(
'_chars',
Many0(Alt([
NoneOf([0x22]),
Value(0x22, Tag('""')),
])));
// Closing quote of a quoted field, followed by `_ws`.
const _closeQuote = Named('_closeQuote', Sequence<String>([_quote, _ws]));
// End of input.
const _eof = Named('_eof', Eof<String>());
// Line ending: one of `\n`, `\r\n` or `\r`.
const _eol = Named('_eol', Tags(['\n', '\r\n', '\r']));
// A single field: a quoted `_string`, with unquoted `_text` as the alternative.
const _field = Named('_field', Alt([_string, _text]));
// `_ws` followed by the opening quote of a quoted field.
const _openQuote = Named('_openQuote', Sequence<String>([_ws, _quote]));
// Top-level parser handed to `fastBuild`: `_rows` terminated by `_eof`.
const _parse = Named('_parse', Terminated(_rows, _eof));
// The `"` character.
const _quote = Named('_quote', Tag('"'));
// A row: a list of `_field`s separated by `,` (`SeparatedList1`).
const _row = Named('_row', SeparatedList1(_field, Tag(',')));
// Separator between rows: a line ending combined with `Not(_eof)`.
// NOTE(review): presumably this keeps a trailing line ending at the very end
// of the input from starting another row — confirm against parser_builder.
const _rowEnding = Named('_rowEnding', Sequence<String>([_eol, Not(_eof)]));
// All rows: `_row`s separated by `_rowEnding`, then an optional final `_eol`.
const _rows =
Named('_rows', Terminated(SeparatedList1(_row, _rowEnding), Opt(_eol)));
// Quoted field: `_chars` between `_openQuote` and `_closeQuote`, converted to
// a `String` by `_toString`.
const _string = Named(
'_string', Delimited(_openQuote, Map$(_chars, _toString), _closeQuote));
// Unquoted field text: characters that are not `,`, `"`, LF (#xA) or CR (#xD).
// NOTE(review): unlike its neighbours this parser is not wrapped in `Named` —
// confirm that is intentional.
const _text = TakeWhile(NotCharClass('[,"] | #xA | #xD'));
// Transformer whose expression template builds a `String` from a list of
// character codes via `String.fromCharCodes`.
const _toString =
ExprTransformer<List<int>, String>('x', 'String.fromCharCodes({{x}})');
// Whitespace skipped around the quotes: tab (#x9) and space (#x20).
const _ws = Named('_ws', SkipWhile(CharClass('#x9 | #x20')));
Performance tests #
The comparison was made against the following CSV parser: csv.
The files from the resource listed below were used to measure performance (excluding files with format violations).
https://people.sc.fsu.edu/~jburkardt/data/csv/csv.html
Source code of the test procedures:
/// Benchmark body for the `csv` package: converts every entry of `_tables`
/// with a `CsvToListConverter`, repeating the whole pass [count] times.
void _test1(int count) {
  var pass = 0;
  while (pass < count) {
    for (final table in _tables) {
      // The converted rows are not used; only the conversion is exercised.
      final rows = CsvToListConverter(
              allowInvalid: false, eol: '\n', shouldParseNumbers: false)
          .convert(table);
    }
    pass++;
  }
}
/// Benchmark body for the configurable parser: parses every entry of `_tables`
/// with `_fast_csv_ex.parse`, repeating the whole pass [count] times.
void _test2(int count) {
  var pass = 0;
  while (pass < count) {
    for (final table in _tables) {
      // The parsed rows are not used; only the parsing is exercised.
      final rows = _fast_csv_ex.parse(table);
    }
    pass++;
  }
}
/// Benchmark body for the non-configurable parser: parses every entry of
/// `_tables` with `_fast_csv.parse`, repeating the whole pass [count] times.
void _test3(int count) {
  var pass = 0;
  while (pass < count) {
    for (final table in _tables) {
      // The parsed rows are not used; only the parsing is exercised.
      final rows = _fast_csv.parse(table);
    }
    pass++;
  }
}
Results:
List of files:
---------------
test_csv\addresses.csv
test_csv\airtravel.csv
test_csv\biostats.csv
test_csv\cities.csv
test_csv\crash_catalonia.csv
test_csv\deniro.csv
test_csv\example.csv
test_csv\faithful.csv
test_csv\ford_escort.csv
test_csv\freshman_kgs.csv
test_csv\freshman_lbs.csv
test_csv\grades.csv
test_csv\homes.csv
test_csv\hooke.csv
test_csv\hurricanes.csv
test_csv\hw_25000.csv
test_csv\lead_shot.csv
test_csv\letter_frequency.csv
test_csv\news_decline.csv
test_csv\nile.csv
test_csv\oscar_age_female.csv
test_csv\snakes_count_10.csv
test_csv\snakes_count_100.csv
test_csv\snakes_count_1000.csv
test_csv\snakes_count_10000.csv
test_csv\tally_cab.csv
test_csv\taxables.csv
test_csv\trees.csv
test_csv\zillow.csv
---------------
Parse in loop by 5 times:
Results:
Time passed: 0.000, Test 'csv': 3115.923 ms
Time passed: 3.118, Test 'fast_csv_ex': 729.273 ms
Time passed: 3.847, Test 'fast_csv': 643.287 ms
Time passed: 4.490, Test 'csv': 3105.506 ms
Time passed: 7.596, Test 'fast_csv_ex': 693.426 ms
Time passed: 8.289, Test 'fast_csv': 642.53 ms
Time passed: 8.932, Test 'csv': 3039.769 ms
Time passed: 11.972, Test 'fast_csv_ex': 717.888 ms
Time passed: 12.690, Test 'fast_csv': 639.85 ms
Time passed: 13.330, Test 'csv': 3030.294 ms
Time passed: 16.360, Test 'fast_csv_ex': 709.727 ms
Time passed: 17.070, Test 'fast_csv': 616.216 ms
Time passed: 17.686, Test 'csv': 3100.673 ms
Time passed: 20.787, Test 'fast_csv_ex': 717.872 ms
Time passed: 21.505, Test 'fast_csv': 623.422 ms