gabrielreid take 2
Clear up some TODOS, simplify the code a bit, which appears to result in a 25% performance increase.
This commit is contained in:
parent
a8a3876416
commit
08af2622d3
@ -22,10 +22,10 @@ import java.io.FileInputStream;
|
|||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.nio.charset.StandardCharsets;
|
import java.nio.charset.StandardCharsets;
|
||||||
import java.util.Arrays;
|
import java.util.Arrays;
|
||||||
|
import java.util.HashMap;
|
||||||
import java.util.Locale;
|
import java.util.Locale;
|
||||||
|
import java.util.Map;
|
||||||
import java.util.Objects;
|
import java.util.Objects;
|
||||||
import java.util.SortedMap;
|
|
||||||
import java.util.TreeMap;
|
|
||||||
import java.util.concurrent.CompletableFuture;
|
import java.util.concurrent.CompletableFuture;
|
||||||
import java.util.concurrent.ForkJoinPool;
|
import java.util.concurrent.ForkJoinPool;
|
||||||
import java.util.concurrent.LinkedBlockingDeque;
|
import java.util.concurrent.LinkedBlockingDeque;
|
||||||
@ -45,12 +45,13 @@ public class CalculateAverage_gabrielreid {
|
|||||||
|
|
||||||
private static final int BLOCK_READ_SIZE = 1024 * 1024 * 16;
|
private static final int BLOCK_READ_SIZE = 1024 * 1024 * 16;
|
||||||
private static final int SUMMARY_TABLE_SIZE = 2048;
|
private static final int SUMMARY_TABLE_SIZE = 2048;
|
||||||
|
private static final int MAP_INITIAL_SIZE = 450;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* State with the full summary table, as well as leftover bytes between processed blocks that need to
|
* State with the full summary table, as well as leftover bytes between processed blocks that need to
|
||||||
* be handled afterward.
|
* be handled afterward.
|
||||||
*/
|
*/
|
||||||
record State(SummaryTable summaryTable, byte[] remainderBytes) {
|
record State(Map<String, CitySummary> map, byte[] remainderBytes) {
|
||||||
}
|
}
|
||||||
|
|
||||||
public static void main(String[] args) throws IOException {
|
public static void main(String[] args) throws IOException {
|
||||||
@ -63,7 +64,7 @@ public class CalculateAverage_gabrielreid {
|
|||||||
}
|
}
|
||||||
try (var fjp = new ForkJoinPool(numCores)) {
|
try (var fjp = new ForkJoinPool(numCores)) {
|
||||||
|
|
||||||
CompletableFuture<State> stateFuture = CompletableFuture.completedFuture(new State(new SummaryTable(SUMMARY_TABLE_SIZE), new byte[0]));
|
CompletableFuture<State> stateFuture = CompletableFuture.completedFuture(new State(new HashMap<>(MAP_INITIAL_SIZE), new byte[0]));
|
||||||
|
|
||||||
try (var fis = new FileInputStream("./measurements.txt")) {
|
try (var fis = new FileInputStream("./measurements.txt")) {
|
||||||
var blockBuilder = Objects.requireNonNull(blockBuilderQueue.poll());
|
var blockBuilder = Objects.requireNonNull(blockBuilderQueue.poll());
|
||||||
@ -77,7 +78,7 @@ public class CalculateAverage_gabrielreid {
|
|||||||
skipToNewline = true;
|
skipToNewline = true;
|
||||||
stateFuture = stateFuture.thenCombine(
|
stateFuture = stateFuture.thenCombine(
|
||||||
CompletableFuture.supplyAsync(() -> {
|
CompletableFuture.supplyAsync(() -> {
|
||||||
var summaryTable = localBlockBuilder.buildSummaryTable(localCnt, localSkipToNewline);
|
var summaryMap = localBlockBuilder.buildSummaryTable(localCnt, localSkipToNewline);
|
||||||
|
|
||||||
int unprocessedRemainderSize = localBlockBuilder.firstLineStart + (localCnt - localBlockBuilder.lastLineEnd);
|
int unprocessedRemainderSize = localBlockBuilder.firstLineStart + (localCnt - localBlockBuilder.lastLineEnd);
|
||||||
var unprocessedBytes = new byte[unprocessedRemainderSize];
|
var unprocessedBytes = new byte[unprocessedRemainderSize];
|
||||||
@ -87,20 +88,20 @@ public class CalculateAverage_gabrielreid {
|
|||||||
|
|
||||||
localBlockBuilder.reset();
|
localBlockBuilder.reset();
|
||||||
blockBuilderQueue.add(localBlockBuilder);
|
blockBuilderQueue.add(localBlockBuilder);
|
||||||
return new State(summaryTable, unprocessedBytes);
|
return new State(summaryMap, unprocessedBytes);
|
||||||
}, fjp), (state, newState) -> {
|
}, fjp), (state, newState) -> {
|
||||||
state.summaryTable.addAll(newState.summaryTable);
|
newState.map.forEach(
|
||||||
|
(k, v) -> state.map.merge(k, v, CitySummary::add));
|
||||||
|
|
||||||
var newRemainderBytes = new byte[state.remainderBytes.length + newState.remainderBytes.length];
|
var newRemainderBytes = new byte[state.remainderBytes.length + newState.remainderBytes.length];
|
||||||
System.arraycopy(state.remainderBytes, 0, newRemainderBytes, 0, state.remainderBytes.length);
|
System.arraycopy(state.remainderBytes, 0, newRemainderBytes, 0, state.remainderBytes.length);
|
||||||
System.arraycopy(newState.remainderBytes, 0, newRemainderBytes, state.remainderBytes.length, newState.remainderBytes.length);
|
System.arraycopy(newState.remainderBytes, 0, newRemainderBytes, state.remainderBytes.length, newState.remainderBytes.length);
|
||||||
return new State(state.summaryTable, newRemainderBytes);
|
return new State(state.map, newRemainderBytes);
|
||||||
});
|
});
|
||||||
|
|
||||||
try {
|
try {
|
||||||
blockBuilder = blockBuilderQueue.poll(1, TimeUnit.HOURS);
|
blockBuilder = blockBuilderQueue.poll(1, TimeUnit.HOURS);
|
||||||
}
|
} catch (InterruptedException e) {
|
||||||
catch (InterruptedException e) {
|
|
||||||
Thread.currentThread().interrupt();
|
Thread.currentThread().interrupt();
|
||||||
throw new RuntimeException(e);
|
throw new RuntimeException(e);
|
||||||
}
|
}
|
||||||
@ -109,33 +110,38 @@ public class CalculateAverage_gabrielreid {
|
|||||||
}
|
}
|
||||||
|
|
||||||
stateFuture = stateFuture.thenApply(state -> {
|
stateFuture = stateFuture.thenApply(state -> {
|
||||||
BlockBuilder blockBuilder = null;
|
BlockBuilder blockBuilder;
|
||||||
try {
|
try {
|
||||||
blockBuilder = blockBuilderQueue.poll(1, TimeUnit.HOURS);
|
blockBuilder = blockBuilderQueue.poll(1, TimeUnit.HOURS);
|
||||||
}
|
} catch (InterruptedException e) {
|
||||||
catch (InterruptedException e) {
|
|
||||||
Thread.currentThread().interrupt();
|
Thread.currentThread().interrupt();
|
||||||
throw new RuntimeException(e);
|
throw new RuntimeException(e);
|
||||||
}
|
}
|
||||||
System.arraycopy(state.remainderBytes, 0, blockBuilder.readBuffer, 0, state.remainderBytes.length);
|
System.arraycopy(state.remainderBytes, 0, blockBuilder.readBuffer, 0, state.remainderBytes.length);
|
||||||
state.summaryTable.addAll(blockBuilder.buildSummaryTable(state.remainderBytes.length, false));
|
|
||||||
return new State(state.summaryTable, new byte[0]);
|
var m = blockBuilder.buildSummaryTable(state.remainderBytes.length, false);
|
||||||
|
m.forEach(
|
||||||
|
(k, v) -> state.map.merge(k, v, CitySummary::add));
|
||||||
|
return new State(state.map, new byte[0]);
|
||||||
});
|
});
|
||||||
|
|
||||||
var state = stateFuture.join();
|
var state = stateFuture.join();
|
||||||
System.out.println(state.summaryTable.toOutputString());
|
System.out.println(STR."{\{state.map.entrySet().stream().sorted(Map.Entry.comparingByKey())
|
||||||
}
|
.map(e -> String.format(Locale.US, "%s=%.1f/%.1f/%.1f", e.getKey(), e.getValue().min / 10f,
|
||||||
}
|
(e.getValue().sum / (float) e.getValue().count) / 10f, e.getValue().max / 10f))
|
||||||
|
.collect(Collectors.joining(", "))}}");
|
||||||
|
|
||||||
|
}}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Parses number values as integers from the byte array.
|
* Parses number values as integers from the byte array.
|
||||||
* <p>
|
* <p>
|
||||||
* The multiplier is 1 if positive and -1 if negative.
|
* The multiplier is 1 if positive and -1 if negative.
|
||||||
*/
|
*/
|
||||||
static short parseNumFromLine(byte[] buf, int offset, int len, int multiplier) {
|
static short parseNumFromLine(byte[] buf, int offset, int len) {
|
||||||
return switch (len) {
|
return switch (len) {
|
||||||
case 3 -> (short) ((((buf[offset] - '0') * 10) + buf[offset + 2] - '0') * multiplier);
|
case 3 -> (short) ((((buf[offset] - '0') * 10) + buf[offset + 2] - '0'));
|
||||||
case 4 -> (short) ((((buf[offset] - '0') * 100) + (buf[offset + 1] - '0') * 10 + buf[offset + 3] - '0') * multiplier);
|
case 4 -> (short) ((((buf[offset] - '0') * 100) + (buf[offset + 1] - '0') * 10 + buf[offset + 3] - '0'));
|
||||||
default -> throw new IllegalStateException("Unexpected number length %d".formatted(len));
|
default -> throw new IllegalStateException("Unexpected number length %d".formatted(len));
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
@ -163,11 +169,12 @@ public class CalculateAverage_gabrielreid {
|
|||||||
this.count++;
|
this.count++;
|
||||||
}
|
}
|
||||||
|
|
||||||
void add(CitySummary other) {
|
CitySummary add(CitySummary other) {
|
||||||
this.max = Math.max(other.max, this.max);
|
this.max = Math.max(other.max, this.max);
|
||||||
this.min = Math.min(other.min, this.min);
|
this.min = Math.min(other.min, this.min);
|
||||||
this.sum += other.sum;
|
this.sum += other.sum;
|
||||||
this.count += other.count;
|
this.count += other.count;
|
||||||
|
return this;
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
@ -180,43 +187,35 @@ public class CalculateAverage_gabrielreid {
|
|||||||
static final class ByteSlice {
|
static final class ByteSlice {
|
||||||
|
|
||||||
private final byte[] buf;
|
private final byte[] buf;
|
||||||
private int offset;
|
private final int offset;
|
||||||
private int len;
|
private final int len;
|
||||||
private int hash;
|
|
||||||
|
|
||||||
public ByteSlice(byte[] buf) {
|
public ByteSlice(byte[] buf, int offset, int len) {
|
||||||
this.buf = buf;
|
this.buf = buf;
|
||||||
}
|
this.offset = offset;
|
||||||
|
this.len = len;
|
||||||
public static ByteSlice clone(ByteSlice src) {
|
|
||||||
var bytes = new byte[src.len];
|
|
||||||
System.arraycopy(src.buf, src.offset, bytes, 0, src.len);
|
|
||||||
var copy = new ByteSlice(bytes);
|
|
||||||
copy.offset = 0;
|
|
||||||
copy.len = src.len;
|
|
||||||
copy.hash = src.hash;
|
|
||||||
return copy;
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public String toString() {
|
|
||||||
return "ByteSlice[%s]".formatted(new String(this.buf, this.offset, this.len, StandardCharsets.UTF_8));
|
|
||||||
}
|
}
|
||||||
|
|
||||||
public String valueAsString() {
|
public String valueAsString() {
|
||||||
return new String(this.buf, this.offset, this.len, StandardCharsets.UTF_8);
|
return new String(this.buf, this.offset, this.len, StandardCharsets.UTF_8);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
public int hashCode() {
|
public int hashCode() {
|
||||||
return this.hash;
|
return hashCode(this.buf, this.offset, this.len);
|
||||||
}
|
}
|
||||||
|
|
||||||
public int calculateHashCode() {
|
public static int hashCode(byte[] buf, int offset, int len) {
|
||||||
int result = 1;
|
int result = 1;
|
||||||
int end = offset + len;
|
int i = 0;
|
||||||
for (int i = offset; i < end; i++) {
|
for (; i + 3 < len; i += 4) {
|
||||||
result = 31 * result + buf[i];
|
result = 31 * 31 * 31 * 31 * result
|
||||||
|
+ 31 * 31 * 31 * buf[offset + i]
|
||||||
|
+ 31 * 31 * buf[offset + i + 1]
|
||||||
|
+ 31 * buf[offset + i + 2]
|
||||||
|
+ buf[offset + i + 3];
|
||||||
|
}
|
||||||
|
for (; i < len; i++) {
|
||||||
|
result = 31 * result + buf[offset + i];
|
||||||
}
|
}
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
@ -230,87 +229,119 @@ public class CalculateAverage_gabrielreid {
|
|||||||
}
|
}
|
||||||
|
|
||||||
public static boolean equal(ByteSlice a, ByteSlice b) {
|
public static boolean equal(ByteSlice a, ByteSlice b) {
|
||||||
return a.hash == b.hash && Arrays.equals(a.buf, a.offset, a.offset + a.len, b.buf, b.offset, b.offset + b.len);
|
return Arrays.equals(a.buf, a.offset, a.offset + a.len, b.buf, b.offset, b.offset + b.len);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public static boolean equal(ByteSlice a, byte[] buf, int offset, int len) {
|
||||||
|
return Arrays.equals(a.buf, a.offset, a.offset + a.len, buf, offset, offset + len);
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
record ValueNode(ByteSlice byteSlice, CitySummary citySummary) {
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
static final class SummaryTable {
|
static final class SummaryTable {
|
||||||
|
|
||||||
|
private static final int LOAD_FACTOR = 4;
|
||||||
|
|
||||||
private int size;
|
private int size;
|
||||||
private ByteSlice[] keys;
|
private ValueNode[] values;
|
||||||
private CitySummary[] values;
|
|
||||||
private int valueCount;
|
private int valueCount;
|
||||||
|
private int resizeThreshold;
|
||||||
|
|
||||||
|
private byte[] localBufferBytes = new byte[MAP_INITIAL_SIZE * 100];
|
||||||
|
private int localBufferPtr = 0;
|
||||||
|
|
||||||
SummaryTable(int size) {
|
SummaryTable(int size) {
|
||||||
this.size = size;
|
this.size = size;
|
||||||
this.keys = new ByteSlice[size];
|
this.values = new ValueNode[size];
|
||||||
this.values = new CitySummary[size];
|
this.resizeThreshold = size / LOAD_FACTOR;
|
||||||
|
}
|
||||||
|
|
||||||
|
void reset() {
|
||||||
|
for (int i = 0; i < size; i++) {
|
||||||
|
this.values[i] = null;
|
||||||
|
}
|
||||||
|
localBufferPtr = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
public void addAll(SummaryTable other) {
|
public void addAll(SummaryTable other) {
|
||||||
for (int i = 0; i < other.size; i++) {
|
for (int i = 0; i < other.size; i++) {
|
||||||
var otherSlice = other.keys[i];
|
var otherSlice = other.values[i];
|
||||||
if (otherSlice != null) {
|
if (otherSlice != null) {
|
||||||
putCitySummary(otherSlice, other.values[i]);
|
putValueNode(otherSlice);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private void putCitySummary(ByteSlice key, CitySummary value) {
|
private void putValueNode(ValueNode valueNode) {
|
||||||
resizeIfNecessary();
|
int hashCode = valueNode.byteSlice.hashCode();
|
||||||
int index = (key.hash & 0x7FFFFFFF) % size;
|
int index = (hashCode & 0x7FFFFFFF) % size;
|
||||||
while (keys[index] != null) {
|
while (values[index] != null) {
|
||||||
if (ByteSlice.equal(keys[index], key)) {
|
if (ByteSlice.equal(values[index].byteSlice, valueNode.byteSlice)) {
|
||||||
values[index].add(value);
|
values[index].citySummary.add(valueNode.citySummary);
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
// TODO Consider secondary hash for the stride here
|
index = (index + (hashCode & 0xFF) + 1) % size;
|
||||||
index = (index + 1) % size;
|
|
||||||
}
|
}
|
||||||
keys[index] = key;
|
values[index] = valueNode;
|
||||||
values[index] = value;
|
|
||||||
valueCount++;
|
valueCount++;
|
||||||
|
resizeIfNecessary();
|
||||||
}
|
}
|
||||||
|
|
||||||
public void putTemperatureValue(ByteSlice key, int value) {
|
public void putTemperatureValue(byte[] buf, int offset, int len, int value) {
|
||||||
resizeIfNecessary();
|
|
||||||
int index = (key.hash & 0x7FFFFFFF) % size;
|
int hashCode = ByteSlice.hashCode(buf, offset, len);
|
||||||
while (keys[index] != null) {
|
int index = (hashCode & 0x7FFFFFFF) % size;
|
||||||
if (ByteSlice.equal(keys[index], key)) {
|
while (values[index] != null) {
|
||||||
values[index].add(value);
|
if (ByteSlice.equal(values[index].byteSlice, buf, offset, len)) {
|
||||||
|
values[index].citySummary.add(value);
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
// TODO Consider secondary hash for the stride here
|
index = (index + (hashCode & 0xFF) + 1) % size;
|
||||||
// System.out.println("Collision!");
|
|
||||||
index = (index + 1) % size;
|
|
||||||
}
|
}
|
||||||
keys[index] = ByteSlice.clone(key);
|
|
||||||
values[index] = new CitySummary(value);
|
System.arraycopy(buf, offset, this.localBufferBytes, this.localBufferPtr, len);
|
||||||
|
var byteSlice = new ByteSlice(this.localBufferBytes, this.localBufferPtr, len);
|
||||||
|
var valueNode = new ValueNode(byteSlice, new CitySummary(value));
|
||||||
|
localBufferPtr += len;
|
||||||
|
|
||||||
|
values[index] = valueNode;
|
||||||
valueCount++;
|
valueCount++;
|
||||||
|
resizeIfNecessary();
|
||||||
}
|
}
|
||||||
|
|
||||||
private void resizeIfNecessary() {
|
private void resizeIfNecessary() {
|
||||||
if (valueCount == size) {
|
if (valueCount >= resizeThreshold) {
|
||||||
var resized = new SummaryTable(size * 2);
|
int newSize = size * 2;
|
||||||
|
var resized = new SummaryTable(newSize);
|
||||||
|
for (int i = 0; i < this.size; i++) {
|
||||||
|
if (this.values[i] != null) {
|
||||||
|
resized.putValueNode(this.values[i]);
|
||||||
|
}
|
||||||
|
}
|
||||||
resized.addAll(this);
|
resized.addAll(this);
|
||||||
this.keys = resized.keys;
|
byte[] localBufferBytes = new byte[this.localBufferBytes.length * 2];
|
||||||
|
System.arraycopy(this.localBufferBytes, 0, localBufferBytes, 0, this.localBufferPtr);
|
||||||
this.values = resized.values;
|
this.values = resized.values;
|
||||||
this.size = resized.size;
|
this.size = newSize;
|
||||||
this.valueCount = resized.valueCount;
|
this.valueCount = resized.valueCount;
|
||||||
|
this.resizeThreshold = newSize / LOAD_FACTOR;
|
||||||
|
this.localBufferBytes = localBufferBytes;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
public String toOutputString() {
|
public Map<String, CitySummary> toMap() {
|
||||||
SortedMap<String, CitySummary> m = new TreeMap<>();
|
HashMap<String, CitySummary> m = HashMap.newHashMap(valueCount);
|
||||||
for (int i = 0; i < size; i++) {
|
for (int i = 0; i < size; i++) {
|
||||||
ByteSlice slice = keys[i];
|
var valueNode = this.values[i];
|
||||||
if (slice != null) {
|
if (valueNode != null) {
|
||||||
m.put(slice.valueAsString(), values[i]);
|
m.put(valueNode.byteSlice.valueAsString(), valueNode.citySummary);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
return "{" + m.entrySet().stream().map(e -> String.format(Locale.US, "%s=%.1f/%.1f/%.1f", e.getKey(), e.getValue().min / 10f,
|
return m;
|
||||||
(e.getValue().sum / (float) e.getValue().count) / 10f, e.getValue().max / 10f)).collect(Collectors.joining(", ")) + "}";
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -319,79 +350,26 @@ public class CalculateAverage_gabrielreid {
|
|||||||
*/
|
*/
|
||||||
static class BlockBuilder {
|
static class BlockBuilder {
|
||||||
final byte[] readBuffer;
|
final byte[] readBuffer;
|
||||||
private final int numSegmentLengths;
|
private final SummaryTable summaryTable;
|
||||||
private final byte[] segmentLengths;
|
|
||||||
private final int[] hashCodes;
|
|
||||||
private final short[] temperatureValues;
|
|
||||||
private final ByteSlice byteSlice;
|
|
||||||
|
|
||||||
private int firstLineStart;
|
private int firstLineStart;
|
||||||
private int lastLineEnd;
|
private int lastLineEnd;
|
||||||
private int lineCount;
|
|
||||||
|
|
||||||
public BlockBuilder(int readBufferSize) {
|
public BlockBuilder(int readBufferSize) {
|
||||||
this.readBuffer = new byte[readBufferSize];
|
this.readBuffer = new byte[readBufferSize];
|
||||||
// TODO This sizing is almost certainly non-optimal, but it seems to work
|
this.summaryTable = new SummaryTable(SUMMARY_TABLE_SIZE);
|
||||||
this.numSegmentLengths = readBufferSize / 2;
|
|
||||||
this.segmentLengths = new byte[numSegmentLengths];
|
|
||||||
this.hashCodes = new int[numSegmentLengths];
|
|
||||||
this.temperatureValues = new short[numSegmentLengths];
|
|
||||||
this.byteSlice = new ByteSlice(this.readBuffer);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void reset() {
|
void reset() {
|
||||||
firstLineStart = -1;
|
firstLineStart = -1;
|
||||||
lastLineEnd = -1;
|
lastLineEnd = -1;
|
||||||
lineCount = 0;
|
this.summaryTable.reset();
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
public SummaryTable buildSummaryTable(int readByteCount, boolean skipToNewline) {
|
public Map<String, CitySummary> buildSummaryTable(int readByteCount, boolean skipToNewline) {
|
||||||
|
|
||||||
parseLineSegments(readByteCount, skipToNewline);
|
parseLineSegments(readByteCount, skipToNewline);
|
||||||
calculateHashesAndTemperatures();
|
return summaryTable.toMap();
|
||||||
|
|
||||||
SummaryTable summaryTable = new SummaryTable(SUMMARY_TABLE_SIZE);
|
|
||||||
|
|
||||||
this.byteSlice.offset = this.firstLineStart;
|
|
||||||
|
|
||||||
int segmentCount = lineCount * 2;
|
|
||||||
int lineCounter = 0;
|
|
||||||
for (int segmentIdx = 0; segmentIdx < segmentCount; segmentIdx += 2) {
|
|
||||||
// TODO It would likely be better if this ByteSlice was just a view on the arrays
|
|
||||||
this.byteSlice.len = this.segmentLengths[segmentIdx];
|
|
||||||
this.byteSlice.hash = this.hashCodes[lineCounter];
|
|
||||||
summaryTable.putTemperatureValue(this.byteSlice, this.temperatureValues[lineCounter]);
|
|
||||||
this.byteSlice.offset += (this.segmentLengths[segmentIdx] + (this.segmentLengths[segmentIdx + 1] & 0b01111111) + 2);
|
|
||||||
lineCounter++;
|
|
||||||
}
|
|
||||||
|
|
||||||
return summaryTable;
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
private void calculateHashesAndTemperatures() {
|
|
||||||
this.byteSlice.offset = this.firstLineStart;
|
|
||||||
|
|
||||||
int segmentCount = lineCount * 2;
|
|
||||||
int lineCounter = 0;
|
|
||||||
for (int segmentIdx = 0; segmentIdx < segmentCount; segmentIdx += 2) {
|
|
||||||
// TODO It would likely be better if this ByteSlice was just a view on the arrays
|
|
||||||
this.byteSlice.len = this.segmentLengths[segmentIdx];
|
|
||||||
this.hashCodes[lineCounter++] = this.byteSlice.calculateHashCode();
|
|
||||||
this.byteSlice.offset += (this.segmentLengths[segmentIdx] + (this.segmentLengths[segmentIdx + 1] & 0b01111111) + 2);
|
|
||||||
}
|
|
||||||
|
|
||||||
// TODO It might be better/faster to do this in the previous loop instead of second loop
|
|
||||||
lineCounter = 0;
|
|
||||||
int offset = this.firstLineStart + this.segmentLengths[0] + 1;
|
|
||||||
for (int segmentIdx = 1; segmentIdx < segmentCount; segmentIdx += 2) {
|
|
||||||
byte segmentLength = this.segmentLengths[segmentIdx];
|
|
||||||
var isNeg = (byte) (segmentLength >> 7);
|
|
||||||
int numLength = (segmentLength & 0b01111111) + isNeg;
|
|
||||||
short temperatureValue = parseNumFromLine(this.readBuffer, offset - isNeg, numLength, (isNeg * 2) + 1);
|
|
||||||
this.temperatureValues[lineCounter++] = temperatureValue;
|
|
||||||
offset += -isNeg + numLength + this.segmentLengths[segmentIdx + 1] + 2;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
private void parseLineSegments(int byteCount, boolean skipToNewline) {
|
private void parseLineSegments(int byteCount, boolean skipToNewline) {
|
||||||
@ -406,22 +384,23 @@ public class CalculateAverage_gabrielreid {
|
|||||||
}
|
}
|
||||||
|
|
||||||
this.firstLineStart = idx;
|
this.firstLineStart = idx;
|
||||||
this.lineCount = 0;
|
|
||||||
int segmentCounter = 0;
|
|
||||||
int lineStart = idx;
|
int lineStart = idx;
|
||||||
|
|
||||||
while (idx < upperBound && lineCount < numSegmentLengths) {
|
while (idx < upperBound) {
|
||||||
var byteVector = ByteVector.fromArray(BYTE_SPECIES, readBuffer, idx);
|
var byteVector = ByteVector.fromArray(BYTE_SPECIES, readBuffer, idx);
|
||||||
var newlineByteMask = byteVector.eq(NEWLINE_BYTE);
|
var newlineIdx = byteVector.eq(NEWLINE_BYTE).firstTrue();
|
||||||
if (newlineByteMask.anyTrue()) {
|
if (newlineIdx < BYTE_SPECIES_LEN) {
|
||||||
var semicolonByteMask = byteVector.eq(SEMICOLON_BYTE);
|
var semicolonByteMask = byteVector.eq(SEMICOLON_BYTE);
|
||||||
var semicolonIdx = semicolonByteMask.firstTrue();
|
var semicolonIdx = semicolonByteMask.firstTrue();
|
||||||
|
|
||||||
int semicolonOffset = idx + semicolonIdx;
|
int semicolonOffset = idx + semicolonIdx;
|
||||||
int lineEnd = idx + newlineByteMask.firstTrue();
|
int lineEnd = idx + newlineIdx;
|
||||||
byte negMult = (byte) ((readBuffer[idx + semicolonIdx + 1] == NEG_BYTE) ? 0b10000000 : 0);
|
short negative = (short) ((readBuffer[idx + semicolonIdx + 1] == NEG_BYTE) ? 1 : 0);
|
||||||
this.segmentLengths[segmentCounter++] = (byte) (semicolonOffset - lineStart);
|
int numLength = (byte) ((lineEnd - (semicolonOffset + 1)));
|
||||||
this.segmentLengths[segmentCounter++] = (byte) ((lineEnd - (semicolonOffset + 1)) | negMult);
|
var num = parseNumFromLine(this.readBuffer, semicolonOffset + 1 + negative, numLength - negative);
|
||||||
this.lineCount++;
|
num = negative == 1 ? (short) -num : num;
|
||||||
|
int nameLen = semicolonOffset - lineStart;
|
||||||
|
summaryTable.putTemperatureValue(this.readBuffer, lineStart, nameLen, num);
|
||||||
idx = lineEnd + 1;
|
idx = lineEnd + 1;
|
||||||
lastLineEnd = idx;
|
lastLineEnd = idx;
|
||||||
lineStart = idx;
|
lineStart = idx;
|
||||||
@ -439,19 +418,19 @@ public class CalculateAverage_gabrielreid {
|
|||||||
}
|
}
|
||||||
if (readBuffer[idx] == NEWLINE_BYTE) {
|
if (readBuffer[idx] == NEWLINE_BYTE) {
|
||||||
int lineEnd = idx;
|
int lineEnd = idx;
|
||||||
byte negMult = (byte) ((readBuffer[semicolonIdx + 1] == NEG_BYTE) ? 0b10000000 : 0);
|
|
||||||
this.segmentLengths[segmentCounter++] = (byte) (semicolonIdx - lineStart);
|
short negative = (short) ((readBuffer[semicolonIdx + 1] == NEG_BYTE) ? 1 : 0);
|
||||||
this.segmentLengths[segmentCounter++] = (byte) ((lineEnd - (semicolonIdx + 1)) | negMult);
|
int numLength = (byte) ((lineEnd - (semicolonIdx + 1)));
|
||||||
this.lineCount++;
|
var num = parseNumFromLine(this.readBuffer, semicolonIdx + 1 + negative, numLength - negative);
|
||||||
|
num = negative == 1 ? (short) -num : num;
|
||||||
|
int nameLen = semicolonIdx - lineStart;
|
||||||
|
summaryTable.putTemperatureValue(this.readBuffer, lineStart, nameLen, num);
|
||||||
idx = lineEnd + 1;
|
idx = lineEnd + 1;
|
||||||
lastLineEnd = idx;
|
lastLineEnd = idx;
|
||||||
lineStart = idx;
|
lineStart = idx;
|
||||||
}
|
}
|
||||||
idx++;
|
idx++;
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user