1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
use crate::{ReadText, ReadTextLayered, TextStr, TextString, WriteText};
use layered_io::Bufferable;
use std::{cmp::max, io};

/// Like `std::io::copy`, but for streams that can operate directly on text
/// strings, so we can avoid re-validating them as text.
pub fn copy_text<R: ReadText + Bufferable + ?Sized, W: WriteText + Bufferable + ?Sized>(
    reader: &mut R,
    writer: &mut W,
) -> io::Result<u64> {
    // TODO: Avoid unnecessary zero-initialization.
    let mut buf = unsafe {
        TextString::from_text_unchecked(" ".repeat(max(
            reader.suggested_buffer_size(),
            writer.suggested_buffer_size(),
        )))
    };

    let mut written = 0;
    loop {
        let len = match reader.read_text(&mut buf) {
            Ok(0) => break,
            Ok(nread) => nread,
            Err(err) if err.kind() == io::ErrorKind::Interrupted => continue,
            Err(err) => return Err(err),
        };
        // TODO: Implement `Index` for `TextStr`?
        writer.write_text(TextStr::from_text(&buf.as_utf8()[..len]).unwrap())?;
        written += len as u64;
    }
    Ok(written)
}

/// Like `std::io::copy`, but for streams that can operate directly on text
/// strings, so we can avoid re-validating them as text.
///
/// Also, like `copy_text`, but uses `read_text_with_status` to avoid performing
/// an extra `read` at the end.
pub fn copy_text_using_status<R: ReadTextLayered + ?Sized, W: WriteText + Bufferable + ?Sized>(
    reader: &mut R,
    writer: &mut W,
) -> io::Result<u64> {
    // TODO: Avoid unnecessary zero-initialization.
    let mut buf = TextString::from_text(" ".repeat(max(
        reader.suggested_buffer_size(),
        writer.suggested_buffer_size(),
    )))
    .unwrap();

    let mut written = 0;
    loop {
        let (len, status) = reader.read_text_with_status(&mut buf)?;
        // TODO: Implement `Index` for `TextStr`?
        writer.write_text(TextStr::from_text(&buf.as_utf8()[..len]).unwrap())?;
        written += len as u64;
        if status.is_end() {
            return Ok(written);
        }
        if status.is_push() {
            writer.flush()?;
        }
    }
}

#[test]
fn test_copy_text() {
    use crate::{TextReader, TextStr, TextWriter};
    use layered_io::{LayeredReader, LayeredWriter};
    use std::{io::Cursor, str};
    use utf8_io::{Utf8Reader, Utf8Writer};

    let text = "hello world ☃\n";
    let mut input = TextReader::new(Utf8Reader::new(LayeredReader::new(Cursor::new(
        text.to_string(),
    ))));
    let mut output = TextWriter::new(Utf8Writer::new(LayeredWriter::new(Vec::new())));

    copy_text(&mut input, &mut output).unwrap();

    let ext = output.close_into_inner().unwrap();
    let vec = ext.abandon_into_inner().abandon_into_inner().unwrap();
    let s = str::from_utf8(&vec).unwrap();
    assert_eq!(s, text);
    let t = TextStr::from_text(s).unwrap();
    assert_eq!(t, text);
}

#[test]
fn test_copy_text_using_status() {
    use crate::{TextReader, TextStr, TextWriter};
    use layered_io::{LayeredReader, LayeredWriter};
    use std::{io::Cursor, str};
    use utf8_io::{Utf8Reader, Utf8Writer};

    let text = "hello world ☃";
    let mut input = TextReader::new(Utf8Reader::new(LayeredReader::new(Cursor::new(
        text.to_string(),
    ))));
    let mut output = TextWriter::new(Utf8Writer::new(LayeredWriter::new(Vec::new())));

    copy_text_using_status(&mut input, &mut output).unwrap();

    let ext = output.close_into_inner().unwrap();
    let vec = ext.abandon_into_inner().abandon_into_inner().unwrap();
    let s = str::from_utf8(&vec).unwrap();
    assert_eq!(s, &format!("{}\n", text));
    let t = TextStr::from_text(s).unwrap();
    assert_eq!(t, &format!("{}\n", text));
}