Use scoped threads (thread::scope) so the Mutex can be shared without Arc
Apply clippy suggestions to my implementations
This commit is contained in:
parent
a3b6075b6a
commit
1193ada82d
@ -1,76 +1,84 @@
|
|||||||
use std::{
|
use std::{
|
||||||
fs::File,
|
fs::File,
|
||||||
io::{BufRead, BufReader},
|
io::{BufRead, BufReader},
|
||||||
sync::{Arc, Mutex},
|
sync::{Mutex},
|
||||||
thread,
|
thread,
|
||||||
};
|
};
|
||||||
use std::collections::HashMap;
|
use std::collections::HashMap;
|
||||||
use std::time::Instant;
|
use std::time::Instant;
|
||||||
|
use onebrc::format_nums;
|
||||||
|
|
||||||
const DEFAULT_HASHMAP_LENGTH: usize = 10000;
|
const DEFAULT_HASHMAP_LENGTH: usize = 10000;
|
||||||
|
|
||||||
fn main() {
|
fn main() {
|
||||||
let now = Instant::now();
|
print!("\x1b[2J");
|
||||||
let stations: Arc<Mutex<HashMap<String, onebrc::StationMeasurements>>> =
|
let stations:Mutex<HashMap<String, onebrc::StationMeasurements>> =
|
||||||
Arc::new(Mutex::new(HashMap::with_capacity(DEFAULT_HASHMAP_LENGTH)));
|
Mutex::new(HashMap::with_capacity(DEFAULT_HASHMAP_LENGTH));
|
||||||
|
thread::scope(|s| {
|
||||||
|
// Doing this allows us to not "move" stations into the closure
|
||||||
|
// and remove the necessity for reference counting (Arc)
|
||||||
|
// no performance improvement but less complex
|
||||||
|
let stations = &stations;
|
||||||
|
let now = Instant::now();
|
||||||
|
|
||||||
let cores: usize = thread::available_parallelism().unwrap().into();
|
let cores: usize = thread::available_parallelism().unwrap().into();
|
||||||
|
|
||||||
let chunk_length = 1_000_000_000 / cores;
|
let chunk_length = 1_000_000_000 / cores;
|
||||||
let mut handles = vec![];
|
for i in 0..cores {
|
||||||
for i in 0..cores {
|
let file = File::open("../../../measurements.txt").expect("File measurements.txt not found");
|
||||||
let file = File::open("../../../measurements.txt").expect("File measurements.txt not found");
|
let reader = BufReader::new(file);
|
||||||
let reader = BufReader::new(file);
|
let line_chunk = reader.lines().skip(chunk_length * i).take(chunk_length);
|
||||||
let line_chunk = reader.lines().skip(chunk_length * i).take(chunk_length);
|
s.spawn(move || {
|
||||||
let stations_clone = stations.clone();
|
let mut t_stations: HashMap<String, onebrc::StationMeasurements> =
|
||||||
let handle = thread::spawn(move || {
|
HashMap::with_capacity(DEFAULT_HASHMAP_LENGTH);
|
||||||
let mut t_stations: HashMap<String, onebrc::StationMeasurements> =
|
|
||||||
HashMap::with_capacity(DEFAULT_HASHMAP_LENGTH);
|
|
||||||
|
|
||||||
let now_read_line = Instant::now();
|
let now_read_line = Instant::now();
|
||||||
println!("Start reading lines in thread {i}");
|
let print_line = i + 1;
|
||||||
line_chunk.for_each(|line| {
|
let mut line_num = 0;
|
||||||
let line = line.expect("could not read line");
|
line_chunk.for_each(|line| {
|
||||||
let (station, temp) = line.split_once(';').expect("Error while splitting");
|
if line_num == 0 {
|
||||||
let temp = onebrc::parse_temp(temp.as_bytes());
|
print!("\x1b[{print_line};30HStart read line {}ms", now_read_line.elapsed().as_millis());
|
||||||
let measurements_option = t_stations.get_mut(station);
|
}
|
||||||
if let Some(measurements) = measurements_option {
|
if line_num % 10000 == 0 {
|
||||||
measurements.update(temp);
|
let formatted = format_nums(line_num);
|
||||||
} else {
|
print!("\x1b[{print_line};0HThread #{i:0>2}: {formatted}");
|
||||||
let measurements = onebrc::StationMeasurements {
|
}
|
||||||
min: temp,
|
line_num += 1;
|
||||||
max: temp,
|
let line = line.expect("could not read line");
|
||||||
count: 1,
|
let (station, temp) = line.split_once(';').expect("Error while splitting");
|
||||||
sum: temp,
|
let temp = onebrc::parse_temp(temp.as_bytes());
|
||||||
};
|
let measurements_option = t_stations.get_mut(station);
|
||||||
t_stations.insert(station.to_owned(), measurements);
|
if let Some(measurements) = measurements_option {
|
||||||
|
measurements.update(temp);
|
||||||
|
} else {
|
||||||
|
let measurements = onebrc::StationMeasurements {
|
||||||
|
min: temp,
|
||||||
|
max: temp,
|
||||||
|
count: 1,
|
||||||
|
sum: temp,
|
||||||
|
};
|
||||||
|
t_stations.insert(station.to_owned(), measurements);
|
||||||
|
}
|
||||||
|
});
|
||||||
|
print!("\x1b[{print_line};60HTime reading lines in thread {i}={} ms", now_read_line.elapsed().as_millis());
|
||||||
|
for (station, measurements) in t_stations.iter() {
|
||||||
|
let mut stations_guard = stations.lock().expect("Error while locking");
|
||||||
|
let joined_measurements_options = stations_guard.get_mut(station.as_str());
|
||||||
|
if let Some(joined_measurements) = joined_measurements_options {
|
||||||
|
joined_measurements.merge(measurements);
|
||||||
|
} else {
|
||||||
|
stations_guard.insert(station.to_owned(), *measurements);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
});
|
});
|
||||||
println!("Time reading lines in thread {i}={} μs", now_read_line.elapsed().as_micros());
|
}
|
||||||
let now_insert_line = Instant::now();
|
let mut stations: Vec<String> = stations.lock().unwrap().iter().map(|(station, measurements)| {
|
||||||
println!("Start inserting lines in thread {i}");
|
let measurements = measurements.to_string();
|
||||||
for (station, measurements) in t_stations.iter() {
|
format!("{station}={measurements}")
|
||||||
let mut stations_guard = stations_clone.lock().expect("Error while locking");
|
}).collect();
|
||||||
let joined_measurements_options = stations_guard.get_mut(station.as_str());
|
stations.sort();
|
||||||
if let Some(joined_measurements) = joined_measurements_options {
|
let _stations = stations.join(",");
|
||||||
joined_measurements.merge(measurements);
|
// println!("{{{stations}}}");
|
||||||
} else {
|
println!("\n\nTime={} ms", now.elapsed().as_millis());
|
||||||
stations_guard.insert(station.to_owned(), *measurements);
|
});
|
||||||
}
|
|
||||||
}
|
|
||||||
println!("Time inserting lines in thread {i}={} μs", now_insert_line.elapsed().as_micros());
|
|
||||||
});
|
|
||||||
handles.push(handle);
|
|
||||||
}
|
|
||||||
for handle in handles {
|
|
||||||
handle.join().unwrap();
|
|
||||||
}
|
|
||||||
let mut stations: Vec<String> = stations.lock().unwrap().iter().map(|(&ref station, &ref measurements)| {
|
|
||||||
let measurements = measurements.to_string();
|
|
||||||
format!("{station}={measurements}")
|
|
||||||
}).collect();
|
|
||||||
stations.sort();
|
|
||||||
let stations = stations.join(",");
|
|
||||||
println!("{{{stations}}}");
|
|
||||||
println!("Time={} μs", now.elapsed().as_micros());
|
|
||||||
}
|
}
|
||||||
|
@ -32,7 +32,7 @@ fn main() {
|
|||||||
stations.insert(station.to_owned(), measurements);
|
stations.insert(station.to_owned(), measurements);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
let mut stations: Vec<String> = stations.iter().map(|(&ref station, &ref measurements)| {
|
let mut stations: Vec<String> = stations.iter().map(|(station, measurements)| {
|
||||||
let measurements = measurements.to_string();
|
let measurements = measurements.to_string();
|
||||||
format!("{station}={measurements}")
|
format!("{station}={measurements}")
|
||||||
}).collect();
|
}).collect();
|
||||||
|
Loading…
Reference in New Issue
Block a user