FastWaveBackend/src/vcd/reader.rs

98 lines
3.1 KiB
Rust
Raw Normal View History

2022-06-03 16:06:20 +00:00
use std::fs::File;
use std::collections::VecDeque;
use std::slice;
use std::str;
use std::io::prelude::*;
use std::io;
2022-07-26 01:16:15 +00:00
#[derive(Debug, Clone)]
2022-07-20 02:05:00 +00:00
pub(super) struct Line(pub(super) usize);
2022-07-26 01:16:15 +00:00
#[derive(Debug, Clone)]
2022-07-20 02:05:00 +00:00
pub(super) struct Word(pub(super) usize);
2022-07-26 01:16:15 +00:00
#[derive(Debug, Clone)]
2022-07-20 02:05:00 +00:00
pub(super) struct Cursor(pub(super) Line, pub(super) Word);
2022-06-03 16:06:20 +00:00
pub struct WordReader {
reader : io::BufReader<File>,
2022-08-02 23:31:35 +00:00
eof : bool,
2022-06-03 16:06:20 +00:00
buffers : Vec<String>,
curr_line : usize,
str_slices : VecDeque<(*const u8, usize, Cursor)>,
2022-07-26 01:16:15 +00:00
curr_slice : Option<(*const u8, usize, Cursor)>,
2022-06-03 16:06:20 +00:00
}
impl WordReader {
2022-07-13 00:02:45 +00:00
pub(super) fn new(file : File) -> WordReader {
2022-08-02 23:31:35 +00:00
let reader = io::BufReader::new(file);
2022-06-03 16:06:20 +00:00
WordReader {
reader : reader,
2022-08-02 23:31:35 +00:00
eof : false,
2022-06-03 16:06:20 +00:00
buffers : vec![],
curr_line : 0,
2022-07-26 01:16:15 +00:00
str_slices : VecDeque::new(),
curr_slice : None
2022-06-03 16:06:20 +00:00
}
}
2022-07-13 00:02:45 +00:00
pub(super) fn next_word(&mut self) -> Option<(&str, Cursor)> {
2022-06-03 16:06:20 +00:00
// if there are no more words, attempt to read more content
// from the file
if self.str_slices.is_empty() {
self.buffers.clear();
2022-08-02 23:31:35 +00:00
if self.eof {return None}
2022-06-03 16:06:20 +00:00
let num_buffers = 10;
for buf_idx in 0..num_buffers {
self.buffers.push(String::new());
self.curr_line += 1;
let bytes_read = self.reader.read_line(&mut self.buffers[buf_idx]).unwrap();
// if we've reached the end of the file on the first attempt to read
// a line in this for loop, no further attempts are necessary and we
if bytes_read == 0 {
2022-08-02 23:31:35 +00:00
self.eof = true;
2022-06-03 16:06:20 +00:00
break;
}
2022-08-02 23:31:35 +00:00
let words = self.buffers[buf_idx].split_ascii_whitespace();
2022-06-03 16:06:20 +00:00
for word in words.enumerate() {
let (word_idx, word) = word;
let position = Cursor(Line(self.curr_line), Word(word_idx + 1));
self.str_slices.push_back((word.as_ptr(), word.len(), position))
}
}
}
// if after we've attempted to read in more content from the file,
// there are still no words...
if self.str_slices.is_empty() {
return None
}
// if we make it here, we return the next word
unsafe {
let (ptr, len, position) = self.str_slices.pop_front().unwrap();
let slice = slice::from_raw_parts(ptr, len);
2022-07-26 01:16:15 +00:00
self.curr_slice = Some((ptr, len, position.clone()));
2022-06-03 16:06:20 +00:00
return Some((str::from_utf8(slice).unwrap(), position));
};
}
2022-07-26 01:16:15 +00:00
pub(super) fn curr_word(&mut self) -> Option<(&str, Cursor)> {
match &self.curr_slice {
Some(slice) => {
unsafe {
let (ptr, len, position) = slice.clone();
let slice = slice::from_raw_parts(ptr, len);
Some((str::from_utf8(slice).unwrap(), position))
}
}
None => {None}
}
}
2022-06-03 16:06:20 +00:00
}