// Copyright 2019 The Rust Project Developers. See the COPYRIGHT // file at the top-level directory of this distribution and at // http://rust-lang.org/COPYRIGHT. // // Licensed under the Apache License, Version 2.0 or the MIT license // , at your // option. This file may not be copied, modified, or distributed // except according to those terms. //! Parameterized string expansion use self::Param::*; use self::States::*; use std::iter::repeat; #[derive(Clone, Copy, PartialEq)] enum States { Nothing, Delay, Percent, SetVar, GetVar, PushParam, CharConstant, CharClose, IntConstant(i32), FormatPattern(Flags, FormatState), SeekIfElse(usize), SeekIfElsePercent(usize), SeekIfEnd(usize), SeekIfEndPercent(usize), } #[derive(Copy, PartialEq, Clone)] enum FormatState { Flags, Width, Precision, } /// Types of parameters a capability can use #[allow(missing_docs)] #[derive(Clone)] pub enum Param { Number(i32), Words(String), } impl Default for Param { fn default() -> Self { Param::Number(0) } } /// An error from interpreting a parameterized string. #[derive(Debug, Eq, PartialEq)] pub enum Error { /// Data was requested from the stack, but the stack didn't have enough elements. StackUnderflow, /// The type of the element(s) on top of the stack did not match the type that the operator /// wanted. TypeMismatch, /// An unrecognized format option was used. UnrecognizedFormatOption(char), /// An invalid variable name was used. InvalidVariableName(char), /// An invalid parameter index was used. InvalidParameterIndex(char), /// A malformed character constant was used. MalformedCharacterConstant, /// An integer constant was too large (overflowed an i32) IntegerConstantOverflow, /// A malformed integer constant was used. MalformedIntegerConstant, /// A format width constant was too large (overflowed a usize) FormatWidthOverflow, /// A format precision constant was too large (overflowed a usize) FormatPrecisionOverflow, } impl ::std::fmt::Display for Error { fn fmt(&self, f: &mut ::std::fmt::Formatter<'_>) -> ::std::fmt::Result { use self::Error::*; match *self { StackUnderflow => f.write_str("not enough elements on the stack"), TypeMismatch => f.write_str("type mismatch"), UnrecognizedFormatOption(_) => f.write_str("unrecognized format option"), InvalidVariableName(_) => f.write_str("invalid variable name"), InvalidParameterIndex(_) => f.write_str("invalid parameter index"), MalformedCharacterConstant => f.write_str("malformed character constant"), IntegerConstantOverflow => f.write_str("integer constant computation overflowed"), MalformedIntegerConstant => f.write_str("malformed integer constant"), FormatWidthOverflow => f.write_str("format width constant computation overflowed"), FormatPrecisionOverflow => { f.write_str("format precision constant computation overflowed") } } } } impl ::std::error::Error for Error {} /// Container for static and dynamic variable arrays #[derive(Default)] pub struct Variables { /// Static variables A-Z sta_vars: [Param; 26], /// Dynamic variables a-z dyn_vars: [Param; 26], } impl Variables { /// Return a new zero-initialized Variables pub fn new() -> Variables { Default::default() } } /// Expand a parameterized capability /// /// # Arguments /// * `cap` - string to expand /// * `params` - vector of params for %p1 etc /// * `vars` - Variables struct for %Pa etc /// /// To be compatible with ncurses, `vars` should be the same between calls to `expand` for /// multiple capabilities for the same terminal. pub fn expand(cap: &[u8], params: &[Param], vars: &mut Variables) -> Result, Error> { let mut state = Nothing; // expanded cap will only rarely be larger than the cap itself let mut output = Vec::with_capacity(cap.len()); let mut stack: Vec = Vec::new(); // Copy parameters into a local vector for mutability let mut mparams = [ Number(0), Number(0), Number(0), Number(0), Number(0), Number(0), Number(0), Number(0), Number(0), ]; for (dst, src) in mparams.iter_mut().zip(params.iter()) { *dst = (*src).clone(); } for &c in cap.iter() { let cur = c as char; let mut old_state = state; match state { Nothing => { if cur == '%' { state = Percent; } else if cur == '$' { state = Delay; } else { output.push(c); } } Delay => { old_state = Nothing; if cur == '>' { state = Nothing; } } Percent => { match cur { '%' => { output.push(c); state = Nothing } 'c' => { match stack.pop() { // if c is 0, use 0200 (128) for ncurses compatibility Some(Number(0)) => output.push(128u8), // Don't check bounds. ncurses just casts and truncates. Some(Number(c)) => output.push(c as u8), Some(_) => return Err(Error::TypeMismatch), None => return Err(Error::StackUnderflow), } } 'p' => state = PushParam, 'P' => state = SetVar, 'g' => state = GetVar, '\'' => state = CharConstant, '{' => state = IntConstant(0), 'l' => match stack.pop() { Some(Words(s)) => stack.push(Number(s.len() as i32)), Some(_) => return Err(Error::TypeMismatch), None => return Err(Error::StackUnderflow), }, '+' | '-' | '/' | '*' | '^' | '&' | '|' | 'm' => { match (stack.pop(), stack.pop()) { (Some(Number(y)), Some(Number(x))) => stack.push(Number(match cur { '+' => x + y, '-' => x - y, '*' => x * y, '/' => x / y, '|' => x | y, '&' => x & y, '^' => x ^ y, 'm' => x % y, _ => unreachable!("logic error"), })), (Some(_), Some(_)) => return Err(Error::TypeMismatch), _ => return Err(Error::StackUnderflow), } } '=' | '>' | '<' | 'A' | 'O' => match (stack.pop(), stack.pop()) { (Some(Number(y)), Some(Number(x))) => stack.push(Number( if match cur { '=' => x == y, '<' => x < y, '>' => x > y, 'A' => x > 0 && y > 0, 'O' => x > 0 || y > 0, _ => unreachable!("logic error"), } { 1 } else { 0 }, )), (Some(_), Some(_)) => return Err(Error::TypeMismatch), _ => return Err(Error::StackUnderflow), }, '!' | '~' => match stack.pop() { Some(Number(x)) => stack.push(Number(match cur { '!' if x > 0 => 0, '!' => 1, '~' => !x, _ => unreachable!("logic error"), })), Some(_) => return Err(Error::TypeMismatch), None => return Err(Error::StackUnderflow), }, 'i' => match (&mparams[0], &mparams[1]) { (&Number(x), &Number(y)) => { mparams[0] = Number(x + 1); mparams[1] = Number(y + 1); } (_, _) => return Err(Error::TypeMismatch), }, // printf-style support for %doxXs 'd' | 'o' | 'x' | 'X' | 's' => { if let Some(arg) = stack.pop() { let flags = Flags::default(); let res = format(arg, FormatOp::from_char(cur), flags)?; output.extend(res); } else { return Err(Error::StackUnderflow); } } ':' | '#' | ' ' | '.' | '0'..='9' => { let mut flags = Flags::default(); let mut fstate = FormatState::Flags; match cur { ':' => (), '#' => flags.alternate = true, ' ' => flags.space = true, '.' => fstate = FormatState::Precision, '0'..='9' => { flags.width = cur as usize - '0' as usize; fstate = FormatState::Width; } _ => unreachable!("logic error"), } state = FormatPattern(flags, fstate); } // conditionals '?' | ';' => (), 't' => match stack.pop() { Some(Number(0)) => state = SeekIfElse(0), Some(Number(_)) => (), Some(_) => return Err(Error::TypeMismatch), None => return Err(Error::StackUnderflow), }, 'e' => state = SeekIfEnd(0), c => return Err(Error::UnrecognizedFormatOption(c)), } } PushParam => { // params are 1-indexed stack.push( mparams[match cur.to_digit(10) { Some(d) => d as usize - 1, None => return Err(Error::InvalidParameterIndex(cur)), }] .clone(), ); } SetVar => { if cur >= 'A' && cur <= 'Z' { if let Some(arg) = stack.pop() { let idx = (cur as u8) - b'A'; vars.sta_vars[idx as usize] = arg; } else { return Err(Error::StackUnderflow); } } else if cur >= 'a' && cur <= 'z' { if let Some(arg) = stack.pop() { let idx = (cur as u8) - b'a'; vars.dyn_vars[idx as usize] = arg; } else { return Err(Error::StackUnderflow); } } else { return Err(Error::InvalidVariableName(cur)); } } GetVar => { if cur >= 'A' && cur <= 'Z' { let idx = (cur as u8) - b'A'; stack.push(vars.sta_vars[idx as usize].clone()); } else if cur >= 'a' && cur <= 'z' { let idx = (cur as u8) - b'a'; stack.push(vars.dyn_vars[idx as usize].clone()); } else { return Err(Error::InvalidVariableName(cur)); } } CharConstant => { stack.push(Number(i32::from(c))); state = CharClose; } CharClose => { if cur != '\'' { return Err(Error::MalformedCharacterConstant); } } IntConstant(i) => { if cur == '}' { stack.push(Number(i)); state = Nothing; } else if let Some(digit) = cur.to_digit(10) { match i .checked_mul(10) .and_then(|i_ten| i_ten.checked_add(digit as i32)) { Some(i) => { state = IntConstant(i); old_state = Nothing; } None => return Err(Error::IntegerConstantOverflow), } } else { return Err(Error::MalformedIntegerConstant); } } FormatPattern(ref mut flags, ref mut fstate) => { old_state = Nothing; match (*fstate, cur) { (_, 'd') | (_, 'o') | (_, 'x') | (_, 'X') | (_, 's') => { if let Some(arg) = stack.pop() { let res = format(arg, FormatOp::from_char(cur), *flags)?; output.extend(res); // will cause state to go to Nothing old_state = FormatPattern(*flags, *fstate); } else { return Err(Error::StackUnderflow); } } (FormatState::Flags, '#') => { flags.alternate = true; } (FormatState::Flags, '-') => { flags.left = true; } (FormatState::Flags, '+') => { flags.sign = true; } (FormatState::Flags, ' ') => { flags.space = true; } (FormatState::Flags, '0'..='9') => { flags.width = cur as usize - '0' as usize; *fstate = FormatState::Width; } (FormatState::Width, '0'..='9') => { flags.width = match flags .width .checked_mul(10) .and_then(|w| w.checked_add(cur as usize - '0' as usize)) { Some(width) => width, None => return Err(Error::FormatWidthOverflow), } } (FormatState::Width, '.') | (FormatState::Flags, '.') => { *fstate = FormatState::Precision; } (FormatState::Precision, '0'..='9') => { flags.precision = match flags .precision .checked_mul(10) .and_then(|w| w.checked_add(cur as usize - '0' as usize)) { Some(precision) => precision, None => return Err(Error::FormatPrecisionOverflow), } } _ => return Err(Error::UnrecognizedFormatOption(cur)), } } SeekIfElse(level) => { if cur == '%' { state = SeekIfElsePercent(level); } old_state = Nothing; } SeekIfElsePercent(level) => { if cur == ';' { if level == 0 { state = Nothing; } else { state = SeekIfElse(level - 1); } } else if cur == 'e' && level == 0 { state = Nothing; } else if cur == '?' { state = SeekIfElse(level + 1); } else { state = SeekIfElse(level); } } SeekIfEnd(level) => { if cur == '%' { state = SeekIfEndPercent(level); } old_state = Nothing; } SeekIfEndPercent(level) => { if cur == ';' { if level == 0 { state = Nothing; } else { state = SeekIfEnd(level - 1); } } else if cur == '?' { state = SeekIfEnd(level + 1); } else { state = SeekIfEnd(level); } } } if state == old_state { state = Nothing; } } Ok(output) } #[derive(Copy, PartialEq, Clone, Default)] struct Flags { width: usize, precision: usize, alternate: bool, left: bool, sign: bool, space: bool, } #[derive(Copy, Clone)] enum FormatOp { Digit, Octal, Hex, HEX, String, } impl FormatOp { fn from_char(c: char) -> FormatOp { use self::FormatOp::*; match c { 'd' => Digit, 'o' => Octal, 'x' => Hex, 'X' => HEX, 's' => String, _ => panic!("bad FormatOp char"), } } } fn format(val: Param, op: FormatOp, flags: Flags) -> Result, Error> { use self::FormatOp::*; let mut s = match val { Number(d) => { match op { Digit => { if flags.sign { format!("{:+01$}", d, flags.precision) } else if d < 0 { // C doesn't take sign into account in precision calculation. format!("{:01$}", d, flags.precision + 1) } else if flags.space { format!(" {:01$}", d, flags.precision) } else { format!("{:01$}", d, flags.precision) } } Octal => { if flags.alternate { // Leading octal zero counts against precision. format!("0{:01$o}", d, flags.precision.saturating_sub(1)) } else { format!("{:01$o}", d, flags.precision) } } Hex => { if flags.alternate && d != 0 { format!("0x{:01$x}", d, flags.precision) } else { format!("{:01$x}", d, flags.precision) } } HEX => { if flags.alternate && d != 0 { format!("0X{:01$X}", d, flags.precision) } else { format!("{:01$X}", d, flags.precision) } } String => return Err(Error::TypeMismatch), } .into_bytes() } Words(s) => match op { String => { let mut s = s.into_bytes(); if flags.precision > 0 && flags.precision < s.len() { s.truncate(flags.precision); } s } _ => return Err(Error::TypeMismatch), }, }; if flags.width > s.len() { let n = flags.width - s.len(); if flags.left { s.extend(repeat(b' ').take(n)); } else { let mut s_ = Vec::with_capacity(flags.width); s_.extend(repeat(b' ').take(n)); s_.extend(s.into_iter()); s = s_; } } Ok(s) } #[cfg(test)] mod test { use super::Param::{self, Number, Words}; use super::{expand, Variables}; use std::result::Result::Ok; #[test] fn test_basic_setabf() { let s = b"\\E[48;5;%p1%dm"; assert_eq!( expand(s, &[Number(1)], &mut Variables::new()).unwrap(), "\\E[48;5;1m".bytes().collect::>() ); } #[test] fn test_multiple_int_constants() { assert_eq!( expand(b"%{1}%{2}%d%d", &[], &mut Variables::new()).unwrap(), "21".bytes().collect::>() ); } #[test] fn test_op_i() { let mut vars = Variables::new(); assert_eq!( expand( b"%p1%d%p2%d%p3%d%i%p1%d%p2%d%p3%d", &[Number(1), Number(2), Number(3)], &mut vars ), Ok("123233".bytes().collect::>()) ); assert_eq!( expand(b"%p1%d%p2%d%i%p1%d%p2%d", &[], &mut vars), Ok("0011".bytes().collect::>()) ); } #[test] fn test_param_stack_failure_conditions() { let mut varstruct = Variables::new(); let vars = &mut varstruct; fn get_res( fmt: &str, cap: &str, params: &[Param], vars: &mut Variables, ) -> Result, super::Error> { let mut u8v: Vec<_> = fmt.bytes().collect(); u8v.extend(cap.as_bytes().iter().cloned()); expand(&u8v, params, vars) } let caps = ["%d", "%c", "%s", "%Pa", "%l", "%!", "%~"]; for &cap in &caps { let res = get_res("", cap, &[], vars); assert!( res.is_err(), "Op {} succeeded incorrectly with 0 stack entries", cap ); let p = if cap == "%s" || cap == "%l" { Words("foo".to_owned()) } else { Number(97) }; let res = get_res("%p1", cap, &[p], vars); assert!( res.is_ok(), "Op {} failed with 1 stack entry: {}", cap, res.err().unwrap() ); } let caps = ["%+", "%-", "%*", "%/", "%m", "%&", "%|", "%A", "%O"]; for &cap in &caps { let res = expand(cap.as_bytes(), &[], vars); assert!( res.is_err(), "Binop {} succeeded incorrectly with 0 stack entries", cap ); let res = get_res("%{1}", cap, &[], vars); assert!( res.is_err(), "Binop {} succeeded incorrectly with 1 stack entry", cap ); let res = get_res("%{1}%{2}", cap, &[], vars); assert!( res.is_ok(), "Binop {} failed with 2 stack entries: {}", cap, res.err().unwrap() ); } } #[test] fn test_push_bad_param() { assert!(expand(b"%pa", &[], &mut Variables::new()).is_err()); } #[test] fn test_comparison_ops() { let v = [ ('<', [1u8, 0u8, 0u8]), ('=', [0u8, 1u8, 0u8]), ('>', [0u8, 0u8, 1u8]), ]; for &(op, bs) in &v { let s = format!("%{{1}}%{{2}}%{}%d", op); let res = expand(s.as_bytes(), &[], &mut Variables::new()); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), vec![b'0' + bs[0]]); let s = format!("%{{1}}%{{1}}%{}%d", op); let res = expand(s.as_bytes(), &[], &mut Variables::new()); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), vec![b'0' + bs[1]]); let s = format!("%{{2}}%{{1}}%{}%d", op); let res = expand(s.as_bytes(), &[], &mut Variables::new()); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), vec![b'0' + bs[2]]); } } #[test] fn test_conditionals() { let mut vars = Variables::new(); let s = b"\\E[%?%p1%{8}%<%t3%p1%d%e%p1%{16}%<%t9%p1%{8}%-%d%e38;5;%p1%d%;m"; let res = expand(s, &[Number(1)], &mut vars); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), "\\E[31m".bytes().collect::>()); let res = expand(s, &[Number(8)], &mut vars); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), "\\E[90m".bytes().collect::>()); let res = expand(s, &[Number(42)], &mut vars); assert!(res.is_ok(), res.err().unwrap()); assert_eq!(res.unwrap(), "\\E[38;5;42m".bytes().collect::>()); } #[test] fn test_format() { let mut varstruct = Variables::new(); let vars = &mut varstruct; assert_eq!( expand( b"%p1%s%p2%2s%p3%2s%p4%.2s", &[ Words("foo".to_owned()), Words("foo".to_owned()), Words("f".to_owned()), Words("foo".to_owned()) ], vars ), Ok("foofoo ffo".bytes().collect::>()) ); assert_eq!( expand(b"%p1%:-4.2s", &[Words("foo".to_owned())], vars), Ok("fo ".bytes().collect::>()) ); assert_eq!( expand(b"%p1%d%p1%.3d%p1%5d%p1%:+d", &[Number(1)], vars), Ok("1001 1+1".bytes().collect::>()) ); assert_eq!( expand( b"%p1%o%p1%#o%p2%6.4x%p2%#6.4X", &[Number(15), Number(27)], vars ), Ok("17017 001b0X001B".bytes().collect::>()) ); } }