CalculateAverage_faridtmammadov (#406)
* create calculate average frd * rename to mach github username * add licesnce header * make script executable --------- Co-authored-by: Farid Mammadov <farid.mammadov@simbrella.com>
This commit is contained in:
parent
b7c24f95cd
commit
07ac6a53c3
21
calculate_average_faridtmammadov.sh
Executable file
21
calculate_average_faridtmammadov.sh
Executable file
@ -0,0 +1,21 @@
|
||||
#!/bin/sh
|
||||
#
|
||||
# Copyright 2023 The original authors
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
#
|
||||
|
||||
|
||||
JAVA_OPTS="--enable-preview"
|
||||
java $JAVA_OPTS --class-path target/average-1.0.0-SNAPSHOT.jar dev.morling.onebrc.CalculateAverage_faridtmammadov
|
||||
|
@ -0,0 +1,203 @@
|
||||
/*
|
||||
* Copyright 2023 The original authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package dev.morling.onebrc;
|
||||
|
||||
import java.io.ByteArrayOutputStream;
|
||||
import java.io.IOException;
|
||||
import java.lang.foreign.Arena;
|
||||
import java.lang.foreign.MemorySegment;
|
||||
import java.lang.foreign.ValueLayout;
|
||||
import java.nio.channels.FileChannel;
|
||||
import java.nio.charset.StandardCharsets;
|
||||
import java.nio.file.Path;
|
||||
import java.nio.file.StandardOpenOption;
|
||||
import java.util.ArrayList;
|
||||
import java.util.HashMap;
|
||||
import java.util.List;
|
||||
import java.util.Map;
|
||||
import java.util.TreeMap;
|
||||
import java.util.stream.Collectors;
|
||||
|
||||
public class CalculateAverage_faridtmammadov {
|
||||
private static final String FILE = "./measurements.txt";
|
||||
|
||||
public static void main(String[] args) throws IOException {
|
||||
int availableProcessors = Runtime.getRuntime().availableProcessors();
|
||||
|
||||
var map = getSegments(availableProcessors).stream()
|
||||
.map(CalculateAverage_faridtmammadov::aggregate).parallel()
|
||||
.flatMap(f -> f.entrySet().stream())
|
||||
.collect(Collectors.toMap(Map.Entry::getKey, Map.Entry::getValue, Aggregate::update, TreeMap::new));
|
||||
|
||||
printFormatted(map);
|
||||
}
|
||||
|
||||
private static List<MemorySegment> getSegments(int numberOfChunks) throws IOException {
|
||||
try (var fileChannel = FileChannel.open(Path.of(FILE), StandardOpenOption.READ)) {
|
||||
var fileSize = fileChannel.size();
|
||||
var segmentSize = fileSize / numberOfChunks;
|
||||
var segment = fileChannel.map(FileChannel.MapMode.READ_ONLY, 0, fileSize, Arena.global());
|
||||
var baseAddress = segment.address();
|
||||
var endAddress = baseAddress + fileSize;
|
||||
var segments = new ArrayList<MemorySegment>();
|
||||
var startAddress = baseAddress;
|
||||
|
||||
for (var i = 0; i < numberOfChunks; i++) {
|
||||
var pointer = startAddress + segmentSize;
|
||||
while (pointer < endAddress) {
|
||||
long offset = pointer - baseAddress;
|
||||
byte b = segment.get(ValueLayout.JAVA_BYTE, offset);
|
||||
if (b == '\n') {
|
||||
break;
|
||||
}
|
||||
pointer++;
|
||||
}
|
||||
if (pointer >= endAddress) {
|
||||
var offsetStart = startAddress - baseAddress;
|
||||
var offsetEnd = endAddress - baseAddress - offsetStart;
|
||||
segments.add(segment.asSlice(offsetStart, offsetEnd));
|
||||
break;
|
||||
}
|
||||
var offsetStart = startAddress - baseAddress;
|
||||
var offsetEnd = pointer - baseAddress - offsetStart;
|
||||
segments.add(segment.asSlice(offsetStart, offsetEnd));
|
||||
startAddress = pointer + 1;
|
||||
}
|
||||
|
||||
return segments;
|
||||
}
|
||||
}
|
||||
|
||||
private static Map<String, Aggregate> aggregate(MemorySegment segment) {
|
||||
var map = new HashMap<String, Aggregate>();
|
||||
var iterator = new MemorySegmentIterator(segment);
|
||||
|
||||
while (iterator.hasNext()) {
|
||||
String city = parseCity(iterator);
|
||||
long temperature = parseTemperature(iterator);
|
||||
|
||||
map.compute(city, (key, value) -> {
|
||||
if (value == null) {
|
||||
return new Aggregate(temperature);
|
||||
}
|
||||
else {
|
||||
return value.update(temperature);
|
||||
}
|
||||
});
|
||||
}
|
||||
|
||||
return map;
|
||||
}
|
||||
|
||||
private static String parseCity(MemorySegmentIterator iterator) {
|
||||
var byteStream = new ByteArrayOutputStream();
|
||||
while (iterator.hasNext()) {
|
||||
var b = iterator.getNextByte();
|
||||
if (b == ';') {
|
||||
return byteStream.toString(StandardCharsets.UTF_8);
|
||||
}
|
||||
byteStream.write(b);
|
||||
}
|
||||
|
||||
return null;
|
||||
}
|
||||
|
||||
public static long parseTemperature(MemorySegmentIterator iterator) {
|
||||
long value = 0L;
|
||||
int sign = 1;
|
||||
while (iterator.hasNext()) {
|
||||
byte b = iterator.getNextByte();
|
||||
if (b >= '0' && b <= '9') {
|
||||
value = value * 10 + b - '0';
|
||||
}
|
||||
else if (b == '\n') {
|
||||
return value * sign;
|
||||
}
|
||||
else if (b == '-') {
|
||||
sign = -1;
|
||||
}
|
||||
}
|
||||
|
||||
return value * sign;
|
||||
}
|
||||
|
||||
private static void printFormatted(Map<String, Aggregate> map) {
|
||||
var iterator = map.entrySet().iterator();
|
||||
var length = map.entrySet().size();
|
||||
System.out.print("{");
|
||||
for (int i = 0; i < length - 1; i++) {
|
||||
var entry = iterator.next();
|
||||
System.out.printf("%s=%s, ", entry.getKey(), entry.getValue().toString());
|
||||
}
|
||||
var lastEntry = iterator.next();
|
||||
System.out.printf("%s=%s}\n", lastEntry.getKey(), lastEntry.getValue().toString());
|
||||
}
|
||||
|
||||
static class Aggregate {
|
||||
long min;
|
||||
long max;
|
||||
long sum;
|
||||
int count;
|
||||
|
||||
public Aggregate(long temperature) {
|
||||
min = temperature;
|
||||
max = temperature;
|
||||
sum = temperature;
|
||||
count = 1;
|
||||
}
|
||||
|
||||
public Aggregate update(long temp) {
|
||||
min = Math.min(min, temp);
|
||||
max = Math.max(max, temp);
|
||||
sum += temp;
|
||||
count++;
|
||||
return this;
|
||||
}
|
||||
|
||||
public Aggregate update(Aggregate agg) {
|
||||
min = Math.min(min, agg.min);
|
||||
max = Math.max(max, agg.max);
|
||||
sum += agg.sum;
|
||||
count += agg.count;
|
||||
return this;
|
||||
}
|
||||
|
||||
public String toString() {
|
||||
return String.format("%s/%s/%s", min / 10.0f, Math.round(sum * 1.0f / count) / 10.0f, max / 10.0f);
|
||||
}
|
||||
}
|
||||
|
||||
static class MemorySegmentIterator {
|
||||
private long offset;
|
||||
private final MemorySegment segment;
|
||||
private final long segmentSize;
|
||||
|
||||
public MemorySegmentIterator(MemorySegment segment) {
|
||||
this.segment = segment;
|
||||
this.segmentSize = segment.byteSize();
|
||||
}
|
||||
|
||||
public boolean hasNext() {
|
||||
return offset < segmentSize;
|
||||
}
|
||||
|
||||
public byte getNextByte() {
|
||||
var b = segment.get(ValueLayout.JAVA_BYTE, offset);
|
||||
offset++;
|
||||
return b;
|
||||
}
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue
Block a user