1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
|
use std::{collections::HashMap, env::current_dir, path::PathBuf, process::exit, str::FromStr};
use log::{error, warn};
use crate::{
chunker::{constants::BUTCK_STORAGE_DIR_NAME, rw::storage::hash::ChunkWriteHash},
special_argument, special_flag,
utils::file_input_solve::parse_path_input,
};
#[derive(Debug, Default)]
pub struct ButckContext {
/// All input files
pub file_paths: Vec<PathBuf>,
/// Path of Butck Storage
pub storage_path: Option<PathBuf>,
// Display chunk boundaries
pub display_boundaries: bool,
/// Whether to read in stream mode
pub stream_read: Option<u32>,
/// Whether to read files using memory mapping
pub memmap_read: bool,
/// Register name
pub register_name: Option<String>,
/// Chunking policy name
pub policy_name: Option<String>,
/// Hash algorithm used for chunking
pub chunk_hash: ChunkWriteHash,
/// Output directory
pub output_dir: PathBuf,
/// Output file (not available for some commands)
pub output_file: Option<PathBuf>,
/// Override parameters
pub params: HashMap<String, String>,
}
impl ButckContext {
/// Apply the args of ChunkerContext to itself
pub fn from_args(mut args: Vec<String>) -> Self {
let mut ctx = ButckContext::default();
let recursive = ctx.read_recursive(&mut args);
ctx.apply_stream_read(&mut args);
ctx.apply_memmap_read(&mut args);
ctx.apply_register_name(&mut args);
ctx.apply_policy_name(&mut args);
ctx.apply_chunk_hash(&mut args);
ctx.apply_storage_dir(&mut args);
ctx.apply_output_paths(&mut args);
ctx.apply_params(&mut args);
ctx.apply_display_boundaries(&mut args);
// Finally, parse path input
ctx.file_paths = parse_path_input(args, recursive, vec![BUTCK_STORAGE_DIR_NAME]);
ctx
}
fn read_recursive(&mut self, args: &mut Vec<String>) -> bool {
special_flag!(args, "-r", "--recursive")
}
fn apply_stream_read(&mut self, args: &mut Vec<String>) {
if let Some(size_str) = special_argument!(args, "-S", "--stream-read")
&& let Ok(size) = size_str.parse::<u32>()
{
self.stream_read = Some(size);
}
}
fn apply_memmap_read(&mut self, args: &mut Vec<String>) -> bool {
special_flag!(args, "-m", "--memmap-read")
}
fn apply_register_name(&mut self, args: &mut Vec<String>) {
self.register_name = special_argument!(args, "-R", "--register");
}
fn apply_policy_name(&mut self, args: &mut Vec<String>) {
self.policy_name = special_argument!(args, "-p", "--policy");
}
fn apply_chunk_hash(&mut self, args: &mut Vec<String>) {
let chunk_hash_str = special_argument!(args, "-H", "--chunk-hash");
self.chunk_hash = match chunk_hash_str {
Some(ref s) => match s.as_str() {
"blake3" => ChunkWriteHash::Blake3,
"sha256" => ChunkWriteHash::Sha256,
_ => ChunkWriteHash::default(),
},
None => ChunkWriteHash::default(),
};
}
fn apply_output_paths(&mut self, args: &mut Vec<String>) {
let output_dir_str = special_argument!(args, "-o", "--output-dir");
let output_file_str = special_argument!(args, "-O", "--output-file");
let current_dir = current_dir().unwrap();
let output_dir = if let Some(output_dir_str) = output_dir_str {
let path = PathBuf::from(output_dir_str);
if path.exists() { Some(path) } else { None }
} else {
None
};
self.output_dir = if let Some(output_dir) = output_dir {
output_dir
} else if let Some(storage_path) = &self.storage_path {
storage_path.clone()
} else {
current_dir
};
self.output_file = output_file_str.map(PathBuf::from)
}
fn apply_params(&mut self, args: &mut Vec<String>) {
while let Some(arg) = special_argument!(args, "+p", "+param") {
let split = arg.split('=').collect::<Vec<&str>>();
if split.len() == 2 {
self.params
.insert(split[0].to_string(), split[1].to_string());
}
}
}
fn apply_storage_dir(&mut self, args: &mut Vec<String>) {
self.storage_path = {
let storage_override = match special_argument!(args, "-s", "--storage") {
Some(o) => {
let path = PathBuf::from_str(o.as_str());
if let Ok(p) = &path {
Self::init_butck_storage(p.clone());
}
path.ok()
}
None => None,
};
Self::find_butck_storage_dir(storage_override)
};
}
fn apply_display_boundaries(&mut self, args: &mut Vec<String>) {
self.display_boundaries = special_flag!(args, "-D", "--display-boundaries");
}
fn init_butck_storage(path: PathBuf) -> Option<PathBuf> {
if !path.exists() {
// If the path does not exist, create it and initialize Butck Storage here
if let Err(e) = std::fs::create_dir_all(&path) {
error!("Failed to create directory '{}': {}", path.display(), e);
exit(1);
}
let butck_dir = path.join(BUTCK_STORAGE_DIR_NAME);
if let Err(e) = std::fs::create_dir_all(&butck_dir) {
error!(
"Failed to create '{}' directory: {}",
BUTCK_STORAGE_DIR_NAME, e
);
exit(1);
}
Some(path)
} else {
let butck_dir = path.join(BUTCK_STORAGE_DIR_NAME);
// Check if Butck Storage already exists
if butck_dir.exists() {
// Butck Storage already exists, return the path
Some(path)
} else {
// Butck Storage doesn't exist, create it with a warning if directory is not empty
let is_empty = path
.read_dir()
.map(|mut entries| entries.next().is_none())
.unwrap_or(false);
if !is_empty {
// Warn about creating storage in non-empty directory
warn!(
"Creating '{}' storage in non-empty directory: {}",
BUTCK_STORAGE_DIR_NAME,
path.display()
);
}
// Create Butck Storage directory
if let Err(e) = std::fs::create_dir_all(&butck_dir) {
error!(
"Failed to create '{}' directory: {}",
BUTCK_STORAGE_DIR_NAME, e
);
exit(1);
}
Some(path)
}
}
}
// Get the ButckStorage directory based on context
fn find_butck_storage_dir(from: Option<PathBuf>) -> Option<PathBuf> {
let mut current_dir = match from {
Some(path) => path,
None => std::env::current_dir().ok()?,
};
loop {
let butck_dir = current_dir.join(BUTCK_STORAGE_DIR_NAME);
if butck_dir.is_dir() {
return Some(current_dir);
}
if !current_dir.pop() {
break;
}
}
None
}
}
|