You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

182 lines
5.5 KiB
Rust

/* TODO:
* . add clap for CLI flags
* . read input as column field1920s
* . test splitting input into fields
* . execute arbitrary shell commands to manipulate input
* . dynamically generate field parameters ?
*/
#![allow(unused_imports)]
use clap::{Parser,CommandFactory};
use clap::error::ErrorKind;
use yargs::{DEFAULT_SEP_PATTERN, stdin};
use yargs::parse::InputText;
use anyhow::Result;
use std::io::{BufRead, Read, BufReader, stdin, Write};
use std::os;
use std::process::{self, Command, Stdio};
#[derive(Parser)]
/// yargs - map commands to columns of text input
///
/// The yargs command maps commands to text columns, it works like `xargs` for tabular text. Input
/// is parsed into columns then passed to commands specified by the user. Commands are mapped to
/// specific columns using positional
/// arguments.
///
/// The first command is applied to the first column, the second command to the second column, etc.
#[derive(Debug)]
#[command(name="yargs")]
#[command(author="blob42")]
#[command(version="0.1")]
struct Cli {
/// Regex used for splitting the input into columns
#[arg(default_value=DEFAULT_SEP_PATTERN)]
#[arg(short)]
delimiter: String,
//TODO:
// -f --field
// skip fields with `-`
#[arg(short, long, action = clap::ArgAction::Count)]
verbose: u8,
/// execute CMD each column of input. 0 < N_CMD < NB_COLUMNS
yargs: Vec<String>
}
fn main() -> Result<()> {
let cli = Cli::parse();
// if let None = cli.f1.as_deref() {
// eprintln!("no field --fX to operate on");
// process::exit(1);
// }
if cli.verbose > 0 {
eprintln!("======\nDEBUG:\n");
eprintln!("{:?}", cli);
for cmd in &cli.yargs {
println!("- {}", cmd);
}
}
// input validation
// take input text, split_columns, nb yargs <= nb columns
// Validate that the number of positional args <= nb of text columns
// ex: input: hello foo bar
// --
// possible ways to call the app:
// $ echo 'hello foo bar' | yargs cat rev 'tr -d b'
// $ echo 'hello foo bar' | yargs cat rev
// $ echo 'hello foo bar' | yargs cat
// let mut cmd = Cli::command();
// Read commands as positional args
// Read input from stdin
let raw_input = stdin::read_stdin()?;
let input_text = InputText::new(&raw_input, &cli.delimiter);
let n_cols = match input_text.n_cols() {
Err(e) => {
eprintln!("error parsing input: {}", e);
process::exit(1)
},
Ok(n) => n,
};
// Check that n args <= input cols
if cli.yargs.len() > input_text.n_cols()? {
// panic!("too many arguments");
eprint!("too many arguments for delimiter={:?}", input_text.sep);
process::exit(1);
}
if cli.verbose > 0 {
eprintln!("detected {n_cols} colunms");
eprintln!("======");
}
let columns = input_text.split()?;
// TODO: RESULT
if cli.yargs.is_empty() {
print!("{}", raw_input);
} else {
// Handle yargs
// For each columns of text, execute the arg command on
// the column lines
// naive implementation
// TODO: map input columns into output processed commands
for (i, yarg) in cli.yargs.into_iter().enumerate() {
// let yarg_cmd = &yarg.split_whitespace().nth(0).unwrap_or(&yarg);
// dbg!(yarg_cmd);
// let yarg_args: Vec<&str> = yarg.split_whitespace().skip(1).collect();
// dbg!(yarg_args);
// for each yarg split into cmd, args
let mut yarg_cmd = Command::new(&yarg.split_whitespace().nth(0).unwrap_or(&yarg))
.args(yarg.split_whitespace().skip(1))
.stdin(Stdio::piped())
.stdout(Stdio::piped())
.spawn()
.expect(&format!("Failed to exec {yarg}"));
let mut yarg_stdin = yarg_cmd.stdin.take().expect("failed to open stdin");
let _columns = columns.clone();
// yarg_stdin.write_all(columns[i].join("\n").as_bytes())?;
// TODO!: use https://crates.io/crates/subprocess to spawn shell
// expl: using a long `awk ..` will fail if args are split on space the cmd needs to be
// passed as is to a subshell
std::thread::spawn(move || {
yarg_stdin.write_all(_columns[i].join("\n").as_bytes()).expect("Failed to write to stdin");
});
// gather output from child
let output = yarg_cmd.wait_with_output()
.expect(format!("failed to read stdout for {}", yarg).as_str());
// TODO: gather output into column similar to input print into column format
println!("{}", String::from_utf8_lossy(&output.stdout));
}
process::exit(0);
// we know we have at least one elm
let yarg = cli.yargs.first().unwrap();
// execute the child process (yarg) using the
// piped input
// EXAMPLE: using thread to spawn the processes
// std::thread::spawn(move || {
// stdin.write_all("Hello, world!".as_bytes()).expect("Failed to write to stdin");
// });
let mut yarg_cmd = Command::new(yarg)
.stdin(Stdio::piped())
.spawn()
.expect(&format!("Failed to exec {yarg}"));
let mut yarg_stdin = yarg_cmd.stdin.take().expect("failed to open stdin");
yarg_stdin.write_all(columns[5].join("\n").as_bytes())?;
// println!("{}", String::from_utf8(output.stdout).unwrap());
}
Ok(())
}