-
Notifications
You must be signed in to change notification settings - Fork 0
/
Program.cs
115 lines (94 loc) · 5.02 KB
/
Program.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
// Copyright 2020 Heath Stewart.
// Licensed under the MIT License. See LICENSE.txt in the project root for license information.
using System;
using System.Collections.Generic;
using System.Reflection;
using System.Text.RegularExpressions;
using BenchmarkDotNet.Attributes;
using BenchmarkDotNet.Running;
namespace Utils
{
[MemoryDiagnoser]
[MarkdownExporterAttribute.GitHub]
public class Program
{
private static readonly Regex _separatorsRe = new Regex(@"[\ ,\.\n]", RegexOptions.Compiled);
private static readonly Regex _separatorsReAll = new Regex(@"[\ ,\.\n]+", RegexOptions.Compiled);
private static readonly char[] _separators = new[] { ' ', ',', '.', '\n' };
static void Main(string[] args)
{
var summary = BenchmarkSwitcher.FromAssembly(Assembly.GetExecutingAssembly()).Run(args);
}
[Params(StringSplitOptions.None, StringSplitOptions.RemoveEmptyEntries)]
public StringSplitOptions Options { get; set; }
[ParamsSource(nameof(GetText))]
public string Text { get; set; }
public IEnumerable<string> GetText => new[]
{
"Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua.",
"Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non proident, sunt in culpa qui officia deserunt mollit anim id est laborum.",
"Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat non proident, sunt in culpa qui officia deserunt mollit anim id est laborum.\nCurabitur pretium tincidunt lacus. Nulla gravida orci a odio. Nullam varius, turpis et commodo pharetra, est eros bibendum elit, nec luctus magna felis sollicitudin mauris. Integer in mauris eu nibh euismod gravida. Duis ac tellus et risus vulputate vehicula. Donec lobortis risus a elit. Etiam tempor. Ut ullamcorper, ligula eu tempor congue, eros est euismod turpis, id tincidunt sapien risus a quam. Maecenas fermentum consequat mi. Donec fermentum. Pellentesque malesuada nulla a mi. Duis sapien sem, aliquet nec, commodo eget, consequat quis, neque. Aliquam faucibus, elit ut dictum aliquet, felis nisl adipiscing sapien, sed malesuada diam lacus eget erat. Cras mollis scelerisque nunc. Nullam arcu. Aliquam consequat. Curabitur augue lorem, dapibus quis, laoreet et, pretium ac, nisi. Aenean magna nisl, mollis quis, molestie eu, feugiat in, orci. In hac habitasse platea dictumst.",
};
[Benchmark(Baseline = true)]
public int UsingString()
{
string[] tokens = Text.Split(_separators, Options);
int count = 0;
foreach (string token in tokens)
{
string value = token.Trim();
count++;
}
return count;
}
[Benchmark]
public int UsingStringTokenizer()
{
StringTokenizer tokenizer = new StringTokenizer(Text, _separators, Options);
int count = 0;
foreach (StringSegment segment in tokenizer)
{
StringSegment value = segment.Trim();
count++;
}
return count;
}
[Benchmark]
public int UsingUnsafeStringTokenizer()
{
StringTokenizer tokenizer = new StringTokenizer(Text, _separators, Options);
int count = 0;
StringTokenizer.Enumerator e = tokenizer.GetEnumerator();
while (e.MoveNext())
{
StringSegment segment = e.Current;
StringSegment value = segment.UnsafeTrim();
count++;
}
return count;
}
[Benchmark]
public int UsingStringTokenizerSpans()
{
StringTokenizer tokenizer = new StringTokenizer(Text, _separators, Options);
int count = 0;
foreach (StringSegment segment in tokenizer)
{
ReadOnlySpan<char> value = segment.AsSpan().Trim();
count++;
}
return count;
}
[Benchmark]
public int UsingRegularExpressions()
{
Regex re = Options == StringSplitOptions.RemoveEmptyEntries ? _separatorsReAll : _separatorsRe;
int count = 0;
foreach (string token in re.Split(Text))
{
count++;
}
return count;
}
}
}