1
0
mirror of https://github.com/chylex/Apache-Prometheus-Exporter.git synced 2025-05-24 04:34:08 +02:00
Apache-Prometheus-Exporter/src/log_file_pattern.rs
2023-09-30 16:01:43 +02:00

229 lines
7.7 KiB
Rust

use std::{env, io};
use std::env::VarError;
use std::fs::DirEntry;
use std::io::ErrorKind;
use std::path::{Path, PathBuf};
use path_slash::PathExt;
/// Reads and parses an environment variable that determines the path and file name pattern of log files.
///
/// Supports 3 pattern types:
///
/// 1. A simple path to a file.
/// 2. A path with a wildcard anywhere in the file name.
/// 3. A path with a standalone wildcard component (i.e. no prefix or suffix in the folder name).
///
/// # Errors
///
/// Returns a human-readable message when the variable is not set, is not valid Unicode,
/// cannot be converted by `to_slash`, or holds a pattern rejected by
/// `parse_log_file_pattern_from_str`.
pub fn parse_log_file_pattern_from_env(variable_name: &str) -> Result<LogFilePattern, String> {
    match env::var(variable_name) {
        Ok(value) => {
            // The parser only understands `/` as a separator, so the value is converted first.
            // `ok_or_else` keeps the error message from being formatted on the success path.
            let pattern_str = Path::new(&value)
                .to_slash()
                .ok_or_else(|| format!("Environment variable {} contains an invalid path.", variable_name))?;

            parse_log_file_pattern_from_str(&pattern_str)
        }
        Err(VarError::NotPresent) => Err(format!("Environment variable {} must be set.", variable_name)),
        Err(VarError::NotUnicode(_)) => Err(format!("Environment variable {} contains invalid characters.", variable_name)),
    }
}
/// Parses a slash-separated path pattern into a [`LogFilePattern`].
///
/// A pattern made only of whitespace (or nothing at all) is rejected. A pattern without `*`
/// is a plain file path. Otherwise the pattern is split at its first `*` and both halves are
/// handed to `parse_log_file_pattern_split_on_wildcard`.
fn parse_log_file_pattern_from_str(pattern_str: &str) -> Result<LogFilePattern, String> {
    let is_blank = pattern_str.chars().all(char::is_whitespace);
    if is_blank {
        return Err(String::from("Path is empty."));
    }

    match pattern_str.split_once('*') {
        Some((before_wildcard, after_wildcard)) => {
            parse_log_file_pattern_split_on_wildcard(before_wildcard, after_wildcard)
        }
        None => Ok(LogFilePattern::WithoutWildcard(pattern_str.to_string())),
    }
}
/// Builds a [`LogFilePattern`] from the two halves of a pattern that was split at its first `*`.
///
/// * `left` - everything before the wildcard.
/// * `right` - everything after the wildcard.
///
/// The wildcard is a folder name when it forms a whole path component (`prefix/*/suffix`, or
/// `*/suffix` at the start of a relative path), and part of a file name when no `/` follows it.
///
/// The folder of a file name wildcard is never left empty, because reading an empty path as a
/// directory fails: a wildcard directly under the root (`/access_*`) yields the folder `/`, and
/// a wildcard with no folder at all (`access_*`) yields `.`. Likewise, a leading folder
/// wildcard (`*/access.log`) yields the prefix `./`.
///
/// # Errors
///
/// * `"Path has too many wildcards."` if either half contains another `*`.
/// * `"Path has a folder wildcard with a prefix or suffix."` if the wildcard is followed by a
///   `/` but is not a whole path component.
fn parse_log_file_pattern_split_on_wildcard(left: &str, right: &str) -> Result<LogFilePattern, String> {
    if left.contains('*') || right.contains('*') {
        return Err(String::from("Path has too many wildcards."));
    }

    if let Some(path_suffix) = right.strip_prefix('/') {
        // The wildcard is a standalone component when nothing, or a `/`, precedes it.
        if left.is_empty() || left.ends_with('/') {
            let path_prefix = if left.is_empty() { "./" } else { left };

            return Ok(LogFilePattern::WithFolderNameWildcard(PatternWithFolderNameWildcard {
                path_prefix: path_prefix.to_string(),
                path_suffix: path_suffix.to_string(),
            }));
        }
    }

    if right.contains('/') {
        return Err(String::from("Path has a folder wildcard with a prefix or suffix."));
    }

    let (folder_path, file_name_prefix) = match left.rsplit_once('/') {
        // The only `/` is the leading one, so the folder is the root itself.
        Some(("", file_name_prefix)) => ("/", file_name_prefix),
        Some(split) => split,
        // No folder given: search the current directory.
        None => (".", left),
    };

    Ok(LogFilePattern::WithFileNameWildcard(PatternWithFileNameWildcard {
        path: folder_path.to_string(),
        file_name_prefix: file_name_prefix.to_string(),
        file_name_suffix: right.to_string(),
    }))
}
/// A pattern whose wildcard is part of the file name, i.e. `path/prefix*suffix`.
#[derive(Debug)]
pub struct PatternWithFileNameWildcard {
    /// Folder whose entries are compared against the file name pattern.
    path: String,
    /// Text a file name must start with (may be empty).
    file_name_prefix: String,
    /// Text a file name must end with (may be empty).
    file_name_suffix: String,
}

impl PatternWithFileNameWildcard {
    /// Returns the part of `file_name` covered by the wildcard, or `None` when the name does
    /// not start with the prefix or what remains does not end with the suffix.
    fn match_wildcard<'a>(&self, file_name: &'a str) -> Option<&'a str> {
        let after_prefix = file_name.strip_prefix(self.file_name_prefix.as_str())?;
        after_prefix.strip_suffix(self.file_name_suffix.as_str())
    }

    /// Applies [`Self::match_wildcard`] to the name of a directory entry.
    ///
    /// Entries whose name is not valid Unicode never match.
    fn match_wildcard_on_dir_entry(&self, dir_entry: &DirEntry) -> Option<String> {
        let entry_name = dir_entry.file_name();
        let file_name = entry_name.to_str()?;
        self.match_wildcard(file_name).map(String::from)
    }
}
/// A pattern whose wildcard replaces one whole folder name, i.e. `path_prefix*/path_suffix`.
#[derive(Debug)]
pub struct PatternWithFolderNameWildcard {
    /// Path of the folder whose sub-folders stand in for the wildcard.
    path_prefix: String,
    /// Path of the log file relative to each matched sub-folder.
    path_suffix: String,
}

impl PatternWithFolderNameWildcard {
    /// Returns the name of `dir_entry` if it is a directory.
    ///
    /// Yields `None` when the entry type cannot be determined, when the entry is not a
    /// directory, or when its name is not valid Unicode.
    fn match_wildcard_on_dir_entry(dir_entry: &DirEntry) -> Option<String> {
        match dir_entry.file_type() {
            Ok(entry_type) if entry_type.is_dir() => dir_entry.file_name().to_str().map(String::from),
            _ => None,
        }
    }
}
/// A parsed log file pattern, one variant per supported pattern type.
#[derive(Debug)]
pub enum LogFilePattern {
    /// A plain path to a single file, without any wildcard.
    WithoutWildcard(String),
    /// A path whose file name contains the wildcard.
    WithFileNameWildcard(PatternWithFileNameWildcard),
    /// A path in which one whole folder name is the wildcard.
    WithFolderNameWildcard(PatternWithFolderNameWildcard),
}

impl LogFilePattern {
    /// Resolves the pattern to concrete log file paths.
    ///
    /// Each result carries a label: the text matched by the wildcard, or an empty string for
    /// a pattern without a wildcard.
    ///
    /// # Errors
    ///
    /// Returns the underlying I/O error if a folder cannot be listed, or
    /// [`ErrorKind::NotFound`] if a plain path neither exists as a file nor has an existing
    /// parent folder.
    pub fn search(&self) -> Result<Vec<LogFilePath>, io::Error> { // TODO error message
        match self {
            Self::WithoutWildcard(path) => Self::search_without_wildcard(path),
            Self::WithFileNameWildcard(pattern) => Self::search_with_file_name_wildcard(pattern),
            Self::WithFolderNameWildcard(pattern) => Self::search_with_folder_name_wildcard(pattern),
        }
    }

    /// Accepts a plain path if the file exists, or if at least its parent folder exists.
    fn search_without_wildcard(path_str: &String) -> Result<Vec<LogFilePath>, io::Error> {
        let path = Path::new(path_str);

        if path.is_file() || Self::parent_dir_exists(path) {
            Ok(vec![LogFilePath::with_empty_label(path_str)])
        } else {
            Err(io::Error::from(ErrorKind::NotFound))
        }
    }

    /// Tells whether the folder that would contain `path` exists.
    ///
    /// A bare relative file name has an empty parent, which denotes the current directory.
    /// It is checked as `.` because an empty path is never reported as a directory.
    fn parent_dir_exists(path: &Path) -> bool {
        match path.parent() {
            Some(parent) if parent.as_os_str().is_empty() => Path::new(".").is_dir(),
            Some(parent) => parent.is_dir(),
            None => false,
        }
    }

    /// Lists the pattern's folder and keeps every entry whose name matches the file name
    /// pattern; the label is the text matched by the wildcard.
    fn search_with_file_name_wildcard(pattern: &PatternWithFileNameWildcard) -> Result<Vec<LogFilePath>, io::Error> {
        let mut result = Vec::new();

        for dir_entry in Path::new(&pattern.path).read_dir()? {
            let dir_entry = dir_entry?;
            if let Some(wildcard_match) = pattern.match_wildcard_on_dir_entry(&dir_entry) {
                result.push(LogFilePath { path: dir_entry.path(), label: wildcard_match });
            }
        }

        Ok(result)
    }

    /// Lists the sub-folders of the pattern's prefix folder and keeps those that contain the
    /// suffix path as an existing file; the label is the sub-folder name.
    fn search_with_folder_name_wildcard(pattern: &PatternWithFolderNameWildcard) -> Result<Vec<LogFilePath>, io::Error> {
        let mut result = Vec::new();

        for dir_entry in Path::new(&pattern.path_prefix).read_dir()? {
            let dir_entry = dir_entry?;
            if let Some(wildcard_match) = PatternWithFolderNameWildcard::match_wildcard_on_dir_entry(&dir_entry) {
                let full_path = dir_entry.path().join(&pattern.path_suffix);
                if full_path.is_file() {
                    result.push(LogFilePath { path: full_path, label: wildcard_match });
                }
            }
        }

        Ok(result)
    }
}
/// A concrete log file found by searching a log file pattern.
pub struct LogFilePath {
    /// Path of the log file.
    pub path: PathBuf,
    /// Text that the pattern's wildcard matched; empty when the pattern had no wildcard.
    pub label: String,
}

impl LogFilePath {
    /// Creates an entry for `s` with an empty label.
    ///
    /// Takes `&str` so that both string slices and `&String` (through deref coercion) are accepted.
    fn with_empty_label(s: &str) -> LogFilePath {
        LogFilePath {
            path: PathBuf::from(s),
            label: String::new(),
        }
    }
}
#[cfg(test)]
mod tests {
    use crate::log_file_pattern::{LogFilePattern, parse_log_file_pattern_from_str};

    /// Asserts that parsing `pattern` fails with exactly `expected_message`.
    fn assert_parse_error(pattern: &str, expected_message: &str) {
        match parse_log_file_pattern_from_str(pattern) {
            Err(message) => assert_eq!(message, expected_message),
            Ok(parsed) => panic!("expected error {:?}, got {:?}", expected_message, parsed),
        }
    }

    /// Asserts that `pattern` parses to a file name wildcard with the given parts.
    fn assert_file_name_wildcard(pattern: &str, path: &str, prefix: &str, suffix: &str) {
        match parse_log_file_pattern_from_str(pattern) {
            Ok(LogFilePattern::WithFileNameWildcard(parsed)) => {
                assert_eq!(parsed.path, path);
                assert_eq!(parsed.file_name_prefix, prefix);
                assert_eq!(parsed.file_name_suffix, suffix);
            }
            other => panic!("expected a file name wildcard pattern, got {:?}", other),
        }
    }

    #[test]
    fn empty_path() {
        assert_parse_error("", "Path is empty.");
        assert_parse_error(" ", "Path is empty.");
    }

    #[test]
    fn too_many_wildcards() {
        assert_parse_error("/path/*/to/files/*.log", "Path has too many wildcards.");
    }

    #[test]
    fn folder_wildcard_with_prefix_not_supported() {
        assert_parse_error("/path/*abc/to/files/access.log", "Path has a folder wildcard with a prefix or suffix.");
    }

    #[test]
    fn folder_wildcard_with_suffix_not_supported() {
        assert_parse_error("/path/abc*/to/files/access.log", "Path has a folder wildcard with a prefix or suffix.");
    }

    #[test]
    fn valid_without_wildcard() {
        match parse_log_file_pattern_from_str("/path/to/file/access.log") {
            Ok(LogFilePattern::WithoutWildcard(path)) => assert_eq!(path, "/path/to/file/access.log"),
            other => panic!("expected a pattern without wildcard, got {:?}", other),
        }
    }

    #[test]
    fn valid_with_file_name_wildcard_prefix() {
        assert_file_name_wildcard("/path/to/files/access_*", "/path/to/files", "access_", "");
    }

    #[test]
    fn valid_with_file_name_wildcard_suffix() {
        assert_file_name_wildcard("/path/to/files/*_access.log", "/path/to/files", "", "_access.log");
    }

    #[test]
    fn valid_with_file_name_wildcard_both() {
        assert_file_name_wildcard("/path/to/files/access_*.log", "/path/to/files", "access_", ".log");
    }

    #[test]
    fn valid_with_folder_wildcard() {
        match parse_log_file_pattern_from_str("/path/to/*/files/access.log") {
            Ok(LogFilePattern::WithFolderNameWildcard(parsed)) => {
                assert_eq!(parsed.path_prefix, "/path/to/");
                assert_eq!(parsed.path_suffix, "files/access.log");
            }
            other => panic!("expected a folder wildcard pattern, got {:?}", other),
        }
    }
}