-
Notifications
You must be signed in to change notification settings - Fork 71
/
explode.rs
88 lines (70 loc) · 2.34 KB
/
explode.rs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
static USAGE: &str = r#"
Explodes a row into multiple ones by splitting a column value based on the
given separator.
For instance the following CSV:
name,colors
John,blue|yellow
Mary,red
Can be exploded on the "colors" <column> based on the "|" <separator> to:
name,colors
John,blue
John,yellow
Mary,red
Usage:
qsv explode [options] <column> <separator> [<input>]
qsv explode --help
explode options:
-r, --rename <name> New name for the exploded column.
Common options:
-h, --help Display this message
-o, --output <file> Write output to <file> instead of stdout.
-n, --no-headers When set, the first row will not be interpreted
as headers.
-d, --delimiter <arg> The field delimiter for reading CSV data.
Must be a single character. (default: ,)
"#;
use serde::Deserialize;
use crate::{
config::{Config, Delimiter},
select::SelectColumns,
util,
util::replace_column_value,
CliResult,
};
#[derive(Deserialize)]
struct Args {
arg_column: SelectColumns,
arg_separator: String,
arg_input: Option<String>,
flag_rename: Option<String>,
flag_output: Option<String>,
flag_no_headers: bool,
flag_delimiter: Option<Delimiter>,
}
pub fn run(argv: &[&str]) -> CliResult<()> {
let args: Args = util::get_args(USAGE, argv)?;
let rconfig = Config::new(args.arg_input.as_ref())
.delimiter(args.flag_delimiter)
.no_headers(args.flag_no_headers)
.select(args.arg_column);
let mut rdr = rconfig.reader()?;
let mut wtr = Config::new(args.flag_output.as_ref()).writer()?;
let headers = rdr.byte_headers()?.clone();
let sel = rconfig.selection(&headers)?;
let column_index = *sel.iter().next().unwrap();
let mut headers = rdr.headers()?.clone();
if let Some(new_name) = args.flag_rename {
headers = replace_column_value(&headers, column_index, &new_name);
}
if !rconfig.no_headers {
wtr.write_record(&headers)?;
}
let mut record = csv::StringRecord::new();
while rdr.read_record(&mut record)? {
for val in record[column_index].split(&args.arg_separator) {
let new_record = replace_column_value(&record, column_index, val);
wtr.write_record(&new_record)?;
}
}
Ok(wtr.flush()?)
}