1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
use anyhow::Result;
use std::io::{BufRead, BufReader, Read, stdin};
use std::fs::File;
use std::sync::mpsc::{self, Sender, Receiver};
use std::thread::{self, JoinHandle};
use crate::Joinable;
use encoding_rs_io::DecodeReaderBytesBuilder;
#[cfg(feature = "gzip")]
use flate2::read::GzDecoder;
/// Reads a bodyfile line by line on a background thread and hands the lines
/// to the consumer through a channel.
pub struct BodyfileReader {
    /// Handle of the background thread running `worker`; taken out by `join`.
    worker: Option<JoinHandle<()>>,

    /// Receiving end of the line channel; taken out by `get_receiver`.
    rx: Option<Receiver<String>>,
}
/// Where the bodyfile content is read from.
enum BodyfileSource {
    /// Read from the standard input of the process.
    Stdin,

    /// Read from an already opened reader that can be moved to another thread
    /// (an opened file, possibly wrapped in a decoder).
    File(Box<dyn Read + Send>),
}
/// Thread body: reads `input` line by line and sends every line through `tx`.
///
/// The input is wrapped in a `DecodeReaderBytes` configured with UTF-8 as the
/// explicit encoding and UTF-8 passthrough enabled, then buffered. Each line
/// is sent exactly as `read_line` produced it, i.e. including its line
/// terminator if there is one.
///
/// The function returns when
/// * the end of the input is reached,
/// * reading fails (the error is reported on stderr together with the
///   1-based line number), or
/// * the receiving side of the channel has been dropped.
fn worker<R: Read + Send>(input: R, tx: Sender<String>) {
    let decoder = DecodeReaderBytesBuilder::new()
        .encoding(Some(encoding_rs::UTF_8))
        .utf8_passthru(true)
        .build(input);
    let mut lines = BufReader::new(decoder);

    // 1-based number of the line currently being read; only used for diagnostics.
    let mut line_no = 1;
    loop {
        // A fresh buffer per line, because ownership moves into the channel.
        let mut buf = String::new();
        match lines.read_line(&mut buf) {
            // Zero bytes read means end of input.
            Ok(0) => break,
            Ok(_) => {
                // Nobody is listening any more, so there is no point in reading on.
                if tx.send(buf).is_err() {
                    break;
                }
            }
            Err(why) => {
                eprintln!("IO Error in line {}: {:?}", line_no, why);
                break;
            }
        }
        line_no += 1;
    }
}
impl BodyfileReader {
pub fn from(filename: &Option<String>) -> Result<Self> {
let input = match filename {
None => BodyfileSource::Stdin,
Some(filename) => {
if filename == "-" { BodyfileSource::Stdin }
else {
let file = File::open(filename)?;
#[cfg(not(feature = "gzip"))]
let reader: Box<dyn BufRead> = Box::new(file);
#[cfg(feature = "gzip")]
let reader = Self::open_gzip(filename, file);
BodyfileSource::File(reader)
}
}
};
let (tx, rx): (Sender<String>, Receiver<String>) = mpsc::channel();
let worker = match input {
BodyfileSource::Stdin => thread::spawn(move || {worker(stdin(), tx);}),
BodyfileSource::File(f) => thread::spawn(move || {worker(f, tx);}),
};
Ok(Self {
worker: Some(worker),
rx: Some(rx)
})
}
#[cfg(feature = "gzip")]
fn open_gzip(filename: &str, file: File) -> Box<dyn Read + Send> {
if filename.ends_with(".gz") {
Box::new(GzDecoder::new(file))
} else {
Box::new(file)
}
}
pub fn get_receiver(&mut self) -> Receiver<String> {
self.rx.take().unwrap()
}
}
impl Joinable<()> for BodyfileReader {
    /// Blocks until the background reader thread has finished and returns the
    /// result of joining it.
    ///
    /// # Panics
    ///
    /// Panics if the thread handle has already been taken, e.g. by a previous
    /// call to `join`.
    fn join(&mut self) -> std::thread::Result<()> {
        let handle = self.worker.take().unwrap();
        handle.join()
    }
}