From cd92518d1be7daaf169160834393c9d0a23f3e82 Mon Sep 17 00:00:00 2001 From: Leandro Fernandes Vieira Date: Sat, 21 Oct 2023 14:33:37 -0300 Subject: [PATCH] done! --- .../VariableLengthReaderRawExtensions.cs | 121 +++++++----------- 1 file changed, 47 insertions(+), 74 deletions(-) diff --git a/RecordParser/Extensions/FileReader/VariableLengthReaderRawExtensions.cs b/RecordParser/Extensions/FileReader/VariableLengthReaderRawExtensions.cs index 741d5e7..04f7359 100644 --- a/RecordParser/Extensions/FileReader/VariableLengthReaderRawExtensions.cs +++ b/RecordParser/Extensions/FileReader/VariableLengthReaderRawExtensions.cs @@ -1,6 +1,6 @@ -using RecordParser.Engines; -using RecordParser.Engines.Reader; +using RecordParser.Builders.Reader; using RecordParser.Extensions.FileReader.RowReaders; +using RecordParser.Parsers; using System; using System.Buffers; using System.Collections.Generic; @@ -12,7 +12,6 @@ namespace RecordParser.Extensions.FileReader { public delegate string StringPool(ReadOnlySpan text); - internal delegate void Get(ref TextFindHelper finder, string[] inst, StringPool cache); public class VariableLengthReaderRawOptions { @@ -59,39 +58,6 @@ public class VariableLengthReaderRawOptions public static class VariableLengthReaderRawExtensions { - private static Get BuildRaw(int collumnCount, bool hasTransform, bool trim) - { - var configParameter = Expression.Parameter(typeof(TextFindHelper).MakeByRefType(), "config"); - var instanceVariable = Expression.Parameter(typeof(string[]), "inst"); - var cacheParameter = Expression.Parameter(typeof(StringPool), "cache"); - - var commands = new Expression[collumnCount]; - for (int i = 0; i < collumnCount; i++) - { - var arrayAccessExpr = Expression.ArrayAccess(instanceVariable, Expression.Constant(i)); - var getValue = (Expression)Expression.Call(configParameter, nameof(TextFindHelper.GetValue), Type.EmptyTypes, Expression.Constant(i)); - - if (trim) - getValue = Expression.Call(typeof(MemoryExtensions), "Trim", Type.EmptyTypes, getValue); - - if (hasTransform) - { - getValue = Expression.Invoke(cacheParameter, getValue); - } - else - { - getValue = Expression.Call(getValue, "ToString", Type.EmptyTypes); - } - - commands[i] = Expression.Assign(arrayAccessExpr, getValue); - } - - var block = Expression.Block(commands); - var final = Expression.Lambda(block, configParameter, instanceVariable, cacheParameter); - - return final.Compile(); - } - /// /// Reads the records from a variable length file, then parses each record /// to object by accessing each field's value by index. @@ -105,41 +71,28 @@ private static Get BuildRaw(int collumnCount, bool hasTransform, bool trim) /// public static IEnumerable ReadRecordsRaw(this TextReader reader, VariableLengthReaderRawOptions options, Func, T> parser) { - var get = BuildRaw(options.ColumnCount, options.StringPoolFactory != null, options.Trim); - var sep = options.Separator; - Func func = options.ContainsQuotedFields - ? () => new RowByQuote(reader, Length, sep) - : () => new RowByLine(reader, Length); + ? () => new RowByQuote(reader, Length, options.Separator) + : () => new RowByLine(reader, Length); var parallelOptions = options.ParallelismOptions ?? new(); return parallelOptions.Enabled - ? GetParallel() - : GetSequential(); + ? GetParallel() + : GetSequential(); IEnumerable GetSequential() { var buffer = new string[options.ColumnCount]; - var stringCache = options.StringPoolFactory?.Invoke(); + var reader = BuildReader(options.Separator, options.ColumnCount, options.Trim, () => buffer, options.StringPoolFactory); var getField = (int i) => buffer[i]; return ReadRecordsSequential(Parser, func, options.HasHeader); T Parser(ReadOnlyMemory memory, int i) { - var finder = new TextFindHelper(memory.Span, sep, QuoteHelper.Quote); - - try - { - get(ref finder, buffer, stringCache); - - return parser(getField); - } - finally - { - finder.Dispose(); - } + reader.Parse(memory.Span); + return parser(getField); } } @@ -151,14 +104,14 @@ IEnumerable GetParallel() .Range(0, maxParallelism) .Select(_ => { - var buf = new string[options.ColumnCount]; + var buffer = new string[options.ColumnCount]; return new { - buffer = buf, + buffer, lockObj = new object(), - stringCache = options.StringPoolFactory?.Invoke(), - getField = new Func(i => buf[i]) + reader = BuildReader(options.Separator, options.ColumnCount, options.Trim, () => buffer, options.StringPoolFactory), + getField = new Func(i => buffer[i]), }; }) .ToArray(); @@ -167,24 +120,44 @@ IEnumerable GetParallel() T Parser(ReadOnlyMemory memory, int i) { - var finder = new TextFindHelper(memory.Span, sep, QuoteHelper.Quote); - - try - { - var r = funcs[i % maxParallelism]; - lock (r.lockObj) - { - get(ref finder, r.buffer, r.stringCache); - - return parser(r.getField); - } - } - finally + var r = funcs[i % maxParallelism]; + lock (r.lockObj) { - finder.Dispose(); + r.reader.Parse(memory.Span); + return parser(r.getField); } } } } + + private static IVariableLengthReader BuildReader(string separator, int columnCount, bool trim, Func factory, Func poolFactory) + { + var builder = new VariableLengthReaderSequentialBuilder(); + + for (var i = 0; i < columnCount; i++) + builder.Map(buildExpression(i)); + + if (poolFactory != null) + { + var pool = poolFactory(); + builder.DefaultTypeConvert(trim + ? x => pool(x.Trim()) + : x => pool(x)); + } + + var reader = builder.Build(separator, factory: factory); + + return reader; + + // builds the lambda: array => array[i] + static Expression> buildExpression(int i) + { + var arrayExpr = Expression.Parameter(typeof(string[])); + var indexExpr = Expression.Constant(i); + var arrayAccessExpr = Expression.ArrayAccess(arrayExpr, indexExpr); + + return Expression.Lambda>(arrayAccessExpr, arrayExpr); + } + } } }