mirror of
https://github.com/twitter/the-algorithm.git
synced 2024-12-23 02:31:52 +01:00
33 lines
1.0 KiB
Rust
33 lines
1.0 KiB
Rust
use npyz::WriterBuilder;
|
|
use npyz::{AutoSerialize, WriteOptions};
|
|
use std::io::BufWriter;
|
|
use std::{
|
|
fs::File,
|
|
io::{self, BufRead},
|
|
};
|
|
|
|
pub fn load_batch_prediction_request_base64(file_name: &str) -> Vec<Vec<u8>> {
|
|
let file = File::open(file_name).expect("could not read file");
|
|
let mut result = vec![];
|
|
for (mut line_count, line) in io::BufReader::new(file).lines().enumerate() {
|
|
line_count += 1;
|
|
match base64::decode(line.unwrap().trim()) {
|
|
Ok(payload) => result.push(payload),
|
|
Err(err) => println!("error decoding line {file_name}:{line_count} - {err}"),
|
|
}
|
|
}
|
|
println!("result len: {}", result.len());
|
|
result
|
|
}
|
|
|
|
pub fn save_to_npy<T: npyz::Serialize + AutoSerialize>(data: &[T], save_to: String) {
|
|
let mut writer = WriteOptions::new()
|
|
.default_dtype()
|
|
.shape(&[data.len() as u64, 1])
|
|
.writer(BufWriter::new(File::create(save_to).unwrap()))
|
|
.begin_nd()
|
|
.unwrap();
|
|
writer.extend(data.to_owned()).unwrap();
|
|
writer.finish().unwrap();
|
|
}
|