Last active
September 10, 2021 21:09
-
-
Save hyrmn/a8a45408d1e2073de7b1f1c09c761925 to your computer and use it in GitHub Desktop.
Surprisingly slower
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
/// <summary>
/// Counts how many bytes equal to <c>Rune</c> remain in <paramref name="file"/>,
/// reading from the stream's current position until <c>Read</c> reports end of stream.
/// </summary>
/// <param name="file">Open, readable file stream. It is read forward and not rewound or disposed.</param>
/// <returns>The number of matching bytes found.</returns>
/// <exception cref="System.OverflowException">
/// The number of matches does not fit in an <see cref="int"/>.
/// </exception>
/// <remarks>
/// Full 32-byte groups are scanned with AVX2 when the CPU supports it; any remaining
/// bytes of a chunk (or every byte, without AVX2) are scanned one at a time so that
/// no part of the input is skipped.
/// </remarks>
static unsafe int CountLines(FileStream file)
{
    const int vectorSize = 256 / 8; // 256 bits, 8 bits in a byte.

    // Same implicit conversion the original relied on when filling its mask buffer.
    byte target = Rune;

    var needle = Vector256.Create(target);
    var zero = Vector256<byte>.Zero;

    // Four 64-bit partial sums; wide enough that they cannot overflow for any real file.
    var accumulator = Vector256<long>.Zero;
    long scalarCount = 0;

    var buffer = new byte[BufferSize];

    // Pin once for the whole scan instead of re-pinning for every chunk.
    fixed (byte* ptr = buffer)
    {
        int read;

        // Stop on a zero-length read rather than trusting file.Length: the stream may not
        // start at position 0 and the file may shrink while it is being read.
        while ((read = file.Read(buffer, 0, buffer.Length)) > 0)
        {
            var i = 0;

            if (Avx2.IsSupported)
            {
                for (; i <= read - vectorSize; i += vectorSize)
                {
                    var v = Avx2.LoadVector256(ptr + i);

                    // 0xFF in every lane that matches, 0x00 elsewhere.
                    var matches = Avx2.CompareEqual(v, needle);

                    // 0 - 0xFF wraps to 1, so each matching lane now holds exactly 1.
                    var ones = Avx2.Subtract(zero, matches);

                    // Sums each group of 8 bytes into the low 16 bits of its 64-bit lane
                    // (upper bits are zero), so the result can be added as four longs.
                    var partialSums = Avx2.SumAbsoluteDifferences(ones, zero);
                    accumulator = Avx2.Add(accumulator, partialSums.AsInt64());
                }
            }

            // Bytes that did not fill a whole vector (or the entire chunk without AVX2).
            for (; i < read; i++)
            {
                if (ptr[i] == target)
                {
                    scalarCount++;
                }
            }
        }
    }

    var total = scalarCount
        + accumulator.GetElement(0)
        + accumulator.GetElement(1)
        + accumulator.GetElement(2)
        + accumulator.GetElement(3);

    // Fail loudly instead of returning a wrapped (possibly negative) count.
    return checked((int)total);
}
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
using System.Numerics; | |
namespace nlc; | |
/// <summary>
/// Counts newline (<c>'\n'</c>) bytes in a stream, comparing
/// <see cref="Vector{T}"/>-sized groups of bytes at a time.
/// </summary>
public class LineCounter
{
    /// <summary>Size in bytes of the buffer used for each read.</summary>
    public const int BufferSize = 128 * 1024;

    // The byte being counted.
    private const byte NewLine = (byte)'\n';

    // NewLine repeated in every lane, for lane-wise comparison.
    private static readonly Vector<byte> s_newLines = new(NewLine);

    /// <summary>
    /// Reads <paramref name="stream"/> until a read returns no bytes and counts
    /// the newline bytes seen.
    /// </summary>
    /// <param name="stream">Readable stream; it is consumed from its current position.</param>
    /// <returns>The number of <c>'\n'</c> bytes read.</returns>
    public uint CountLines(Stream stream)
    {
        int lanes = Vector<byte>.Count;
        Span<byte> chunk = new byte[BufferSize];
        uint total = 0;

        while (true)
        {
            int filled = stream.Read(chunk);
            if (filled <= 0)
            {
                break;
            }

            int offset = 0;
            int lastVectorStart = filled - lanes;

            while (offset <= lastVectorStart)
            {
                var block = new Vector<byte>(chunk.Slice(offset, lanes));

                // Equal lanes are 0xFF; negating wraps each to 1, so the dot product
                // with an all-ones vector is the number of matches in this block.
                Vector<byte> hits = Vector.Equals(block, s_newLines);
                total += Vector.Dot(-hits, Vector<byte>.One);

                offset += lanes;
            }

            // Leftover bytes that did not fill a whole vector.
            for (; offset < filled; offset++)
            {
                if (chunk[offset] == NewLine)
                {
                    total++;
                }
            }
        }

        return total;
    }
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Try this