Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add unicode handling capability #106

Open
wants to merge 6 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
14 changes: 14 additions & 0 deletions examples/cat.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
use rexpect::error::Error;
use rexpect::spawn;

/// Spawns `cat`, sends it one line containing a non-ASCII character and
/// prints both the line that was sent and the line that was read back.
///
/// Any error from spawning, sending or reading is propagated to the caller.
fn main() -> Result<(), Error> {
    // NOTE(review): `Some(1000)` is presumably the session timeout in
    // milliseconds; confirm against `spawn`'s signature.
    let mut session = spawn("cat", Some(1000))?;

    let input = String::from("∀");
    session.send_line(&input)?;
    let output = session.read_line()?;

    println!("In: {}", input);
    println!("Out: {}", output);
    Ok(())
}
7 changes: 7 additions & 0 deletions src/encoding.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
/// Character encoding used to interpret the raw bytes received by the reader.
///
/// The default is [`Encoding::UTF8`].
#[derive(Debug, PartialEq, Eq, Clone, Copy, Default)]
pub enum Encoding {
    /// Every incoming byte is appended to the buffer as its own `char`.
    ASCII,
    /// Incoming bytes are collected until they form valid UTF-8, and the
    /// decoded character is then appended to the buffer.
    #[default]
    UTF8,
}
2 changes: 2 additions & 0 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -64,11 +64,13 @@
//! }
//! ```

pub mod encoding;
pub mod error;
pub mod process;
pub mod reader;
pub mod session;

pub use encoding::Encoding;
pub use reader::ReadUntil;
pub use session::{spawn, spawn_bash, spawn_python, spawn_stream, spawn_with_options};

Expand Down
43 changes: 42 additions & 1 deletion src/reader.rs
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
//! Unblocking reader which supports waiting for strings/regexes and EOF to be present

use crate::encoding::Encoding;
use crate::error::Error;
pub use regex::Regex;
use std::io::prelude::*;
Expand Down Expand Up @@ -108,6 +109,7 @@ pub fn find(needle: &ReadUntil, buffer: &str, eof: bool) -> Option<(usize, usize
// Configuration handed to the non-blocking reader when it is constructed.
pub struct Options {
/// Read timeout in milliseconds; the reader converts it with
/// `Duration::from_millis`. `None` leaves the reader's timeout unset.
pub timeout_ms: Option<u64>,
/// NOTE(review): presumably enables stripping of ANSI escape sequences from
/// the data that was read; its use is not visible in this hunk, so confirm.
pub strip_ansi_escape_codes: bool,
/// Encoding the reader uses to turn incoming bytes into characters.
pub encoding: Encoding,
}

/// Non blocking reader
Expand All @@ -120,6 +122,7 @@ pub struct NBReader {
buffer: String,
eof: bool,
timeout: Option<time::Duration>,
encoding: Encoding,
}

impl NBReader {
Expand Down Expand Up @@ -174,6 +177,7 @@ impl NBReader {
buffer: String::with_capacity(1024),
eof: false,
timeout: options.timeout_ms.map(time::Duration::from_millis),
encoding: options.encoding,
}
}

Expand All @@ -182,9 +186,22 @@ impl NBReader {
if self.eof {
return Ok(());
}
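// NOTE: In UTF-8 mode there is no recovery from a broken multi-byte sequence
// that is never completed: its bytes stay in `char_buf`, every later byte is
// appended to that already-invalid buffer, and no further characters are
// decoded during this call.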
let mut char_buf: Vec<u8> = Vec::new();

while let Ok(from_channel) = self.reader.try_recv() {
match from_channel {
Ok(PipedChar::Char(c)) => self.buffer.push(c as char),
Ok(PipedChar::Char(c)) => match &self.encoding {
Encoding::ASCII => self.buffer.push(c as char),
Encoding::UTF8 => {
char_buf.push(c);
if let Ok(s) = std::str::from_utf8(&char_buf) {
self.buffer.push(s.chars().next().unwrap());
char_buf.clear();
}
}
},
Ok(PipedChar::EOF) => self.eof = true,
// this is just from experience, e.g. "sleep 5" returns the other error which
// most probably means that there is no stdout stream at all -> send EOF
Expand Down Expand Up @@ -321,6 +338,28 @@ mod tests {
Err(_) => panic!(),
}
}
/// Reads a line that starts with a multi-byte UTF-8 character and checks that
/// it is returned intact, followed by EOF on the next read.
#[test]
fn test_expect_unicode() {
    let source = io::Cursor::new("∀ melon\r\n");
    let options = Options {
        encoding: Encoding::UTF8,
        ..Default::default()
    };
    let mut reader = NBReader::new(source, options);

    // The text before the line ending and the line ending itself come back
    // as a pair.
    let expected = ("∀ melon".to_string(), "\r\n".to_string());
    let actual = reader
        .read_until(&ReadUntil::String("\r\n".to_string()))
        .expect("cannot read line");
    assert_eq!(expected, actual);

    // check for EOF: anything other than an EOF error fails the test
    let after_line = reader.read_until(&ReadUntil::NBytes(10));
    if !matches!(after_line, Err(Error::EOF { .. })) {
        panic!();
    }
}

#[test]
fn test_regex() {
Expand Down Expand Up @@ -413,6 +452,7 @@ mod tests {
Options {
timeout_ms: None,
strip_ansi_escape_codes: true,
..Default::default()
},
);
let bytes = r
Expand All @@ -430,6 +470,7 @@ mod tests {
Options {
timeout_ms: None,
strip_ansi_escape_codes: true,
..Default::default()
},
);
let bytes = r
Expand Down
3 changes: 3 additions & 0 deletions src/session.rs
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ use crate::error::Error; // load error-chain
use crate::process::PtyProcess;
use crate::reader::{NBReader, Regex};
pub use crate::reader::{Options, ReadUntil};
use crate::Encoding;
use std::fs::File;
use std::io::prelude::*;
use std::io::LineWriter;
Expand Down Expand Up @@ -237,6 +238,7 @@ pub fn spawn_command(command: Command, timeout_ms: Option<u64>) -> Result<PtySes
Options {
timeout_ms,
strip_ansi_escape_codes: false,
..Default::default()
},
)
}
Expand Down Expand Up @@ -442,6 +444,7 @@ pub fn spawn_stream<R: Read + Send + 'static, W: Write>(
Options {
timeout_ms,
strip_ansi_escape_codes: false,
..Default::default()
},
)
}
Expand Down