1
0
mirror of https://github.com/jht5945/finding.git synced 2025-12-27 21:20:05 +08:00
Files
finding/src/main.rs

366 lines
13 KiB
Rust

extern crate argparse;
extern crate term;
extern crate term_size;
extern crate rust_util;
use std::{
cell::RefCell,
fs::File,
path::Path,
io::prelude::*,
time::SystemTime,
};
use argparse::{ArgumentParser, StoreTrue, Store};
use rust_util::*;
const VERSION: &str = env!("CARGO_PKG_VERSION");
const GIT_HASH: &str = env!("GIT_HASH");
fn print_version() {
print!(r#"finding {} - {}
Copyright (C) 2019 Hatter Jiang.
License MIT <https://opensource.org/licenses/MIT>
Written by Hatter Jiang
"#, VERSION, &GIT_HASH[0..7]);
}
fn get_term_width() -> Option<usize> {
match term_size::dimensions() {
None => None,
Some((w, _h)) => Some(w),
}
}
// thanks https://blog.csdn.net/star_xiong/article/details/89401149
fn find_char_boundary(s: &str, index: usize) -> usize {
if s.len() <= index {
return index;
}
let mut new_index = index;
while !s.is_char_boundary(new_index) {
new_index += 1;
}
new_index
}
fn get_term_width_message(message: &str, left: usize) -> String {
match get_term_width() {
None => message.to_string(),
Some(w) => {
let len = message.len();
if w > len {
return message.to_string();
}
let mut s = String::new();
s.push_str(&message[0..find_char_boundary(&message, w-10-5-left)]);
s.push_str("[...]");
s.push_str(&message[find_char_boundary(&message, len-10)..]);
s
},
}
}
fn find_huge_files(options: &Options, dir_path: &Path) {
walk_dir(&dir_path, &|_, _| (/* do not process error */), &|p| {
match p.metadata() {
Err(err) => {
if options.verbose {
let p_str = p.to_str();
if p_str.is_some() {
print_lastline("");
print_message(MessageType::WARN, &format!("Read file {} meta failed: {}", p_str.unwrap(), err));
}
}
return;
},
Ok(metadata) => {
let len = metadata.len();
if len >= options.parsed_huge_file_size {
match p.to_str() {
None => (),
Some(p_str) => {
print_lastline("");
print_message(MessageType::OK, &format!("{} [{}]", p_str, get_display_size(len as i64)));
},
}
}
},
}
}, &|p| {
match p.to_str() {
None => (),
Some(p_str) => print_lastline(&get_term_width_message(&format!("Scanning: {}", p_str), 10)),
}
true
}).unwrap_or(());
print_lastline("");
}
fn read_file_content(file: &Path, large_file_len: u64) -> XResult<String> {
if ! file.exists() {
return Err(new_box_error(&format!("File not exists: {:?}", file)));
}
if ! file.is_file() {
return Err(new_box_error(&format!("File is not file: {:?}", file)));
}
let file_len = file.metadata()?.len();
if file_len > large_file_len {
return Err(new_box_error(&format!("File too large: {:?}, len: {}", file, file_len)));
}
let mut f = File::open(file)?;
let mut content = String::new();
f.read_to_string(&mut content)?;
Ok(content)
}
#[derive(Debug)]
struct MatchLine {
line_number: usize,
line_string: String,
}
impl MatchLine {
fn new(l_no: usize, l_str: String) -> MatchLine {
MatchLine {
line_number: l_no,
line_string: l_str,
}
}
}
fn match_lines(tag: &str, content: &String, options: &Options) -> bool {
let search_text = &options.search_text;
let lines = content.lines();
let mut match_lines_vec = vec![];
let mut l_no = 0usize;
let the_search_text = &match options.ignore_case {
true => search_text.to_lowercase(),
false => search_text.to_string(),
};
for ln in lines {
if options.filter_large_line && ln.len() as u64 >= options.parsed_large_line_size {
if options.verbose {
print_lastline("");
print_message(MessageType::INFO, &format!("Skip large line: {} bytes", ln.len()));
}
continue;
}
let matches = match options.ignore_case {
true => ln.to_lowercase().contains(the_search_text),
false => ln.contains(the_search_text),
};
if matches {
match_lines_vec.push(MatchLine::new(l_no, ln.to_string()));
}
l_no += 1;
}
let mut matches_any = false;
if match_lines_vec.len() > 0 {
print_lastline("");
print_message(MessageType::OK, &format!("Find in {}:", tag));
for i in 0..match_lines_vec.len() {
print!("{}: ", match_lines_vec[i].line_number + 1);
match options.ignore_case {
true => println!("{}", match_lines_vec[i].line_string),
false => {
let ss: Vec<&str> = match_lines_vec[i].line_string.split(search_text).collect();
for j in 0..ss.len() {
print!("{}", ss[j]);
if j < ss.len() -1 {
print_color(Some(term::color::RED), true, search_text);
}
}
println!();
},
}
}
matches_any = true;
}
matches_any
}
fn find_text_files(options: &Options, dir_path: &Path) {
if options.search_text.len() < 1 {
print_message(MessageType::ERROR, "Param search_text cannot be empty.");
return;
}
if options.ignore_case {
print_message(MessageType::WARN, "Using ignore case mode, highlight print is disabled.");
}
let file_exts = match options.file_ext.as_str() {
"" => vec![],
ext => {
ext.split(",").map(|s| s.trim()).filter(|s| s.len() > 0).map(|s| String::from(".") + s).collect()
},
};
let total_file_count_cell = RefCell::new(0u64);
let scaned_file_count_cell = RefCell::new(0u64);
let matched_file_count_cell = RefCell::new(0u64);
let total_dir_count_cell = RefCell::new(0u64);
let scaned_dir_count_cell = RefCell::new(0u64);
walk_dir(&dir_path, &|_, _| (/* do not process error */), &|p| {
total_file_count_cell.replace_with(|&mut c| c + 1);
let p_str = match p.to_str() {
None => return,
Some(s) => s,
};
if file_exts.len() > 0 {
let mut file_ext_matches = false;
for i in 0..file_exts.len() {
if p_str.to_lowercase().ends_with(&file_exts[i]) {
file_ext_matches = true;
break;
}
}
if ! file_ext_matches {
return;
}
}
let file_content = match read_file_content(p, options.parsed_large_text_file_size) {
Err(err) => {
if options.verbose {
print_lastline("");
print_message(MessageType::WARN, &format!("Read file {} failed: {}", p_str, err));
}
return;
},
Ok(c) => c,
};
scaned_file_count_cell.replace_with(|&mut c| c + 1);
if match_lines(p_str, &file_content, &options) {
matched_file_count_cell.replace_with(|&mut c| c + 1);
}
}, &|p| {
total_dir_count_cell.replace_with(|&mut c| c + 1);
match p.to_str() {
None => (),
Some(p_str) => {
if (! options.scan_dot_git) && p_str.ends_with("/.git") {
if options.verbose {
print_lastline("");
print_message(MessageType::INFO, &format!("Skip .git dir: {}", p_str));
}
return false;
}
scaned_dir_count_cell.replace_with(|&mut c| c + 1);
print_lastline(&get_term_width_message(&format!("Scanning: {}", p_str), 10))
},
}
true
}).unwrap_or(());
print_lastline("");
print_message(MessageType::OK, &format!("Total dir count: {}, scaned dir count: {}",
total_dir_count_cell.into_inner(),
scaned_dir_count_cell.into_inner()));
print_message(MessageType::OK, &format!("Total file count: {}, scaned file count: {}, matched file count: {}",
total_file_count_cell.into_inner(),
scaned_file_count_cell.into_inner(),
matched_file_count_cell.into_inner()));
}
struct Options {
version: bool,
target: String,
huge_file_size: String,
parsed_huge_file_size: u64,
large_text_file_size: String,
parsed_large_text_file_size: u64,
dir: String,
file_ext: String,
ignore_case: bool,
filter_large_line: bool,
large_line_size: String,
parsed_large_line_size: u64,
scan_dot_git: bool,
verbose: bool,
search_text: String,
}
fn main() {
let mut options = Options {
version: false,
target: String::from("text"),
huge_file_size: String::from("100M"),
parsed_huge_file_size: 0u64,
large_text_file_size: String::from("10M"),
parsed_large_text_file_size: 0u64,
file_ext: String::new(),
ignore_case: false,
dir: String::from("."),
filter_large_line: false,
large_line_size: String::from("10KB"),
parsed_large_line_size: 0u64,
scan_dot_git: false,
verbose: false,
search_text: String::new(),
};
{
let mut ap = ArgumentParser::new();
ap.set_description("finding - command line find tool.");
ap.refer(&mut options.target).add_option(&["-t", "--target"], Store, "Target, text, huge[file], default text");
ap.refer(&mut options.dir).add_option(&["-d", "--dir"], Store, "Target directory, default current dir(.)");
ap.refer(&mut options.huge_file_size).add_option(&["--huge-file"], Store, "Huge file size, default 100M");
ap.refer(&mut options.large_text_file_size).add_option(&["--large-text-file"], Store, "Large text file, default 10M");
ap.refer(&mut options.file_ext).add_option(&["-f", "--file-ext"], Store, "File ext, default all");
ap.refer(&mut options.ignore_case).add_option(&["-i", "--ignore-case"], StoreTrue, "Ignore case, default false");
ap.refer(&mut options.filter_large_line).add_option(&["--filter-large-line"], StoreTrue, "Filter large line");
ap.refer(&mut options.large_line_size).add_option(&["--large-line-size"], Store, "Large line, default 10KB");
ap.refer(&mut options.scan_dot_git).add_option(&["--scan-dot-git"], StoreTrue, "Scan dot git");
ap.refer(&mut options.version).add_option(&["-v", "--version"], StoreTrue, "Print version");
ap.refer(&mut options.verbose).add_option(&["--verbose"], StoreTrue, "Verbose");
ap.refer(&mut options.search_text).add_argument("SEARCH TEXT", Store, "Search text");
ap.parse_args_or_exit();
}
if options.version {
print_version();
return;
}
options.parsed_huge_file_size = match parse_size(&options.huge_file_size) {
Err(err) => {
print_message(MessageType::ERROR, &format!("Parse huge file size failed: {}", err));
return;
},
Ok(bytes) => bytes as u64,
};
options.parsed_large_text_file_size = match parse_size(&options.large_text_file_size) {
Err(err) => {
print_message(MessageType::ERROR, &format!("Parse large text file size failed: {}", err));
return;
},
Ok(bytes) => bytes as u64,
};
options.parsed_large_line_size = match parse_size(&options.large_line_size) {
Err(err) => {
print_message(MessageType::ERROR, &format!("Parse large line size failed: {}", err));
return;
},
Ok(bytes) => bytes as u64,
};
let dir_path = match get_absolute_path(&options.dir) {
None => {
print_message(MessageType::ERROR, &format!("Cannot find dir: {}", options.dir));
return;
},
Some(path) => path,
};
let start = SystemTime::now();
match options.target.as_str() {
"huge" | "hugefile" => find_huge_files(&options, &dir_path),
"text" => find_text_files(&options, &dir_path),
unknown => {
print_message(MessageType::ERROR, &format!("Unknown command: {}", unknown));
return;
},
}
let cost_millis = SystemTime::now().duration_since(start.clone()).unwrap().as_millis();
print_message(MessageType::OK, &format!("Finding finished, cost {} ms", cost_millis));
}