]>
Commit | Line | Data |
---|---|---|
4ce7da51 | 1 | use std::sync::{Mutex, Arc}; |
2ab5acac | 2 | use std::path::{Path, PathBuf}; |
97168f92 | 3 | use std::os::unix::io::AsRawFd; |
a2479cfa | 4 | |
f7d4e4b5 | 5 | use anyhow::{bail, format_err, Error}; |
a2479cfa | 6 | use futures::*; |
ea368a06 | 7 | |
a2479cfa | 8 | use openssl::ssl::{SslMethod, SslAcceptor, SslFiletype}; |
7c667013 | 9 | use tokio_stream::wrappers::ReceiverStream; |
a723c087 | 10 | use serde_json::Value; |
a2479cfa | 11 | |
9ea4bce4 | 12 | use proxmox::try_block; |
a2479cfa | 13 | use proxmox::api::RpcEnvironmentType; |
32413921 | 14 | use proxmox::sys::linux::socket::set_tcp_keepalive; |
fd6d2438 DM |
15 | use proxmox::tools::fs::CreateOptions; |
16 | ||
17 | use proxmox_rest_server::ApiConfig; | |
a2479cfa | 18 | |
1298618a DM |
19 | use proxmox_backup::{ |
20 | backup::DataStore, | |
21 | server::{ | |
26858dba | 22 | auth::default_api_auth, |
1298618a | 23 | WorkerTask, |
1298618a DM |
24 | rest::*, |
25 | jobstate::{ | |
26 | self, | |
27 | Job, | |
28 | }, | |
29 | rotate_task_log_archive, | |
30 | }, | |
1298618a DM |
31 | }; |
32 | ||
af06decd | 33 | use pbs_buildcfg::configdir; |
dd2162f6 | 34 | use pbs_systemd::time::{compute_next_event, parse_calendar_event}; |
6c76aa43 | 35 | use pbs_tools::logrotate::LogRotate; |
1298618a | 36 | |
89725197 DM |
37 | use pbs_api_types::{ |
38 | Authid, TapeBackupJobConfig, VerificationJobConfig, SyncJobConfig, DataStoreConfig, | |
39 | PruneOptions, | |
40 | }; | |
e7d4be9d | 41 | |
8bca935f DM |
42 | use proxmox_rest_server::daemon; |
43 | ||
e3f41f21 | 44 | use proxmox_backup::server; |
d01e2420 | 45 | use proxmox_backup::auth_helpers::*; |
97168f92 | 46 | use proxmox_backup::tools::{ |
32413921 | 47 | PROXMOX_BACKUP_TCP_KEEPALIVE_TIME, |
97168f92 DM |
48 | disks::{ |
49 | DiskManage, | |
50 | zfs_pool_stats, | |
368f4c54 | 51 | get_pool_from_dataset, |
97168f92 | 52 | }, |
97168f92 | 53 | }; |
02c7a755 | 54 | |
e7d4be9d | 55 | |
a13573c2 | 56 | use proxmox_backup::api2::pull::do_sync_job; |
8513626b | 57 | use proxmox_backup::api2::tape::backup::do_tape_backup_job; |
1298618a | 58 | use proxmox_backup::server::do_verification_job; |
b8d90798 | 59 | use proxmox_backup::server::do_prune_job; |
a13573c2 | 60 | |
946c3e8a | 61 | fn main() -> Result<(), Error> { |
ac7513e3 DM |
62 | proxmox_backup::tools::setup_safe_path_env(); |
63 | ||
21211748 DM |
64 | let backup_uid = pbs_config::backup_user()?.uid; |
65 | let backup_gid = pbs_config::backup_group()?.gid; | |
843880f0 TL |
66 | let running_uid = nix::unistd::Uid::effective(); |
67 | let running_gid = nix::unistd::Gid::effective(); | |
68 | ||
69 | if running_uid != backup_uid || running_gid != backup_gid { | |
70 | bail!("proxy not running as backup user or group (got uid {} gid {})", running_uid, running_gid); | |
71 | } | |
72 | ||
d420962f | 73 | pbs_runtime::main(run()) |
4223d9f8 DM |
74 | } |
75 | ||
fda5797b | 76 | async fn run() -> Result<(), Error> { |
02c7a755 DM |
77 | if let Err(err) = syslog::init( |
78 | syslog::Facility::LOG_DAEMON, | |
79 | log::LevelFilter::Info, | |
80 | Some("proxmox-backup-proxy")) { | |
4223d9f8 | 81 | bail!("unable to inititialize syslog - {}", err); |
02c7a755 DM |
82 | } |
83 | ||
e1d367df DM |
84 | // Note: To debug early connection error use |
85 | // PROXMOX_DEBUG=1 ./target/release/proxmox-backup-proxy | |
86 | let debug = std::env::var("PROXMOX_DEBUG").is_ok(); | |
87 | ||
d01e2420 DM |
88 | let _ = public_auth_key(); // load with lazy_static |
89 | let _ = csrf_secret(); // load with lazy_static | |
90 | ||
02c7a755 | 91 | let mut config = ApiConfig::new( |
af06decd | 92 | pbs_buildcfg::JS_DIR, |
26858dba SR |
93 | &proxmox_backup::api2::ROUTER, |
94 | RpcEnvironmentType::PUBLIC, | |
95 | default_api_auth(), | |
96 | )?; | |
02c7a755 | 97 | |
02c7a755 DM |
98 | config.add_alias("novnc", "/usr/share/novnc-pve"); |
99 | config.add_alias("extjs", "/usr/share/javascript/extjs"); | |
7f066a9b | 100 | config.add_alias("qrcodejs", "/usr/share/javascript/qrcodejs"); |
02c7a755 DM |
101 | config.add_alias("fontawesome", "/usr/share/fonts-font-awesome"); |
102 | config.add_alias("xtermjs", "/usr/share/pve-xtermjs"); | |
abd4c4cb | 103 | config.add_alias("locale", "/usr/share/pbs-i18n"); |
02c7a755 | 104 | config.add_alias("widgettoolkit", "/usr/share/javascript/proxmox-widget-toolkit"); |
9c01e73c | 105 | config.add_alias("docs", "/usr/share/doc/proxmox-backup/html"); |
02c7a755 | 106 | |
af06decd | 107 | let mut indexpath = PathBuf::from(pbs_buildcfg::JS_DIR); |
2ab5acac DC |
108 | indexpath.push("index.hbs"); |
109 | config.register_template("index", &indexpath)?; | |
01ca99da | 110 | config.register_template("console", "/usr/share/pve-xtermjs/index.html.hbs")?; |
2ab5acac | 111 | |
fd6d2438 DM |
112 | let backup_user = pbs_config::backup_user()?; |
113 | let mut commando_sock = proxmox_rest_server::CommandoSocket::new(crate::server::our_ctrl_sock(), backup_user.gid); | |
114 | ||
115 | let dir_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid); | |
116 | let file_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid); | |
a68768cf | 117 | |
fd6d2438 DM |
118 | config.enable_file_log( |
119 | pbs_buildcfg::API_ACCESS_LOG_FN, | |
120 | Some(dir_opts), | |
121 | Some(file_opts), | |
122 | &mut commando_sock, | |
123 | )?; | |
8e7e2223 | 124 | |
02c7a755 DM |
125 | let rest_server = RestServer::new(config); |
126 | ||
6d1f61b2 | 127 | //openssl req -x509 -newkey rsa:4096 -keyout /etc/proxmox-backup/proxy.key -out /etc/proxmox-backup/proxy.pem -nodes |
6d1f61b2 | 128 | |
4ce7da51 | 129 | // we build the initial acceptor here as we cannot start if this fails |
c381a162 | 130 | let acceptor = make_tls_acceptor()?; |
4ce7da51 | 131 | let acceptor = Arc::new(Mutex::new(acceptor)); |
6d1f61b2 | 132 | |
4ce7da51 | 133 | // to renew the acceptor we just add a command-socket handler |
a723c087 WB |
134 | commando_sock.register_command( |
135 | "reload-certificate".to_string(), | |
136 | { | |
4ce7da51 | 137 | let acceptor = Arc::clone(&acceptor); |
a723c087 | 138 | move |_value| -> Result<_, Error> { |
4ce7da51 DM |
139 | log::info!("reloading certificate"); |
140 | match make_tls_acceptor() { | |
141 | Err(err) => log::error!("error reloading certificate: {}", err), | |
142 | Ok(new_acceptor) => { | |
143 | let mut guard = acceptor.lock().unwrap(); | |
144 | *guard = new_acceptor; | |
145 | } | |
146 | } | |
a723c087 WB |
147 | Ok(Value::Null) |
148 | } | |
149 | }, | |
150 | )?; | |
0d176f36 | 151 | |
062cf75c DC |
152 | // to remove references for not configured datastores |
153 | commando_sock.register_command( | |
154 | "datastore-removed".to_string(), | |
155 | |_value| { | |
156 | if let Err(err) = proxmox_backup::backup::DataStore::remove_unused_datastores() { | |
157 | log::error!("could not refresh datastores: {}", err); | |
158 | } | |
159 | Ok(Value::Null) | |
160 | } | |
161 | )?; | |
162 | ||
a690ecac WB |
163 | let server = daemon::create_daemon( |
164 | ([0,0,0,0,0,0,0,0], 8007).into(), | |
a723c087 | 165 | move |listener, ready| { |
97168f92 | 166 | |
4ce7da51 | 167 | let connections = accept_connections(listener, acceptor, debug); |
7c667013 | 168 | let connections = hyper::server::accept::from_stream(ReceiverStream::new(connections)); |
083ff3fd WB |
169 | |
170 | Ok(ready | |
48aa2b93 | 171 | .and_then(|_| hyper::Server::builder(connections) |
083ff3fd | 172 | .serve(rest_server) |
fd6d2438 | 173 | .with_graceful_shutdown(proxmox_rest_server::shutdown_future()) |
083ff3fd WB |
174 | .map_err(Error::from) |
175 | ) | |
176 | .map_err(|err| eprintln!("server error: {}", err)) | |
177 | .map(|_| ()) | |
a690ecac | 178 | ) |
a2ca7137 | 179 | }, |
d7c6ad60 | 180 | "proxmox-backup-proxy.service", |
083ff3fd | 181 | ); |
a2ca7137 | 182 | |
af06decd | 183 | server::write_pid(pbs_buildcfg::PROXMOX_BACKUP_PROXY_PID_FN)?; |
d98c9a7a WB |
184 | daemon::systemd_notify(daemon::SystemdNotify::Ready)?; |
185 | ||
fda5797b | 186 | let init_result: Result<(), Error> = try_block!({ |
a68768cf TL |
187 | server::register_task_control_commands(&mut commando_sock)?; |
188 | commando_sock.spawn()?; | |
fd6d2438 | 189 | proxmox_rest_server::server_state_init()?; |
fda5797b WB |
190 | Ok(()) |
191 | }); | |
d607b886 | 192 | |
fda5797b WB |
193 | if let Err(err) = init_result { |
194 | bail!("unable to start daemon - {}", err); | |
195 | } | |
e3f41f21 | 196 | |
8545480a | 197 | start_task_scheduler(); |
eaeda365 | 198 | start_stat_generator(); |
8545480a | 199 | |
083ff3fd | 200 | server.await?; |
a546a8a0 | 201 | log::info!("server shutting down, waiting for active workers to complete"); |
fd6d2438 | 202 | proxmox_rest_server::last_worker_future().await?; |
fda5797b | 203 | log::info!("done - exit server"); |
e3f41f21 | 204 | |
4223d9f8 | 205 | Ok(()) |
02c7a755 | 206 | } |
8545480a | 207 | |
4ce7da51 | 208 | fn make_tls_acceptor() -> Result<SslAcceptor, Error> { |
c381a162 WB |
209 | let key_path = configdir!("/proxy.key"); |
210 | let cert_path = configdir!("/proxy.pem"); | |
211 | ||
212 | let mut acceptor = SslAcceptor::mozilla_intermediate_v5(SslMethod::tls()).unwrap(); | |
213 | acceptor.set_private_key_file(key_path, SslFiletype::PEM) | |
214 | .map_err(|err| format_err!("unable to read proxy key {} - {}", key_path, err))?; | |
215 | acceptor.set_certificate_chain_file(cert_path) | |
216 | .map_err(|err| format_err!("unable to read proxy cert {} - {}", cert_path, err))?; | |
217 | acceptor.check_private_key().unwrap(); | |
218 | ||
4ce7da51 | 219 | Ok(acceptor.build()) |
c381a162 WB |
220 | } |
221 | ||
a5e3be49 WB |
222 | type ClientStreamResult = |
223 | Result<std::pin::Pin<Box<tokio_openssl::SslStream<tokio::net::TcpStream>>>, Error>; | |
224 | const MAX_PENDING_ACCEPTS: usize = 1024; | |
225 | ||
48aa2b93 | 226 | fn accept_connections( |
0bfcea6a | 227 | listener: tokio::net::TcpListener, |
4ce7da51 | 228 | acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>, |
e1d367df | 229 | debug: bool, |
a5e3be49 | 230 | ) -> tokio::sync::mpsc::Receiver<ClientStreamResult> { |
48aa2b93 | 231 | |
ea93bea7 | 232 | let (sender, receiver) = tokio::sync::mpsc::channel(MAX_PENDING_ACCEPTS); |
48aa2b93 | 233 | |
4ce7da51 | 234 | tokio::spawn(accept_connection(listener, acceptor, debug, sender)); |
a5e3be49 WB |
235 | |
236 | receiver | |
237 | } | |
238 | ||
239 | async fn accept_connection( | |
240 | listener: tokio::net::TcpListener, | |
4ce7da51 | 241 | acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>, |
a5e3be49 WB |
242 | debug: bool, |
243 | sender: tokio::sync::mpsc::Sender<ClientStreamResult>, | |
244 | ) { | |
ea93bea7 | 245 | let accept_counter = Arc::new(()); |
48aa2b93 | 246 | |
a5e3be49 | 247 | loop { |
4ce7da51 DM |
248 | let (sock, _addr) = match listener.accept().await { |
249 | Ok(conn) => conn, | |
250 | Err(err) => { | |
251 | eprintln!("error accepting tcp connection: {}", err); | |
cc269b9f | 252 | continue; |
a5e3be49 | 253 | } |
cc269b9f | 254 | }; |
48aa2b93 | 255 | |
cc269b9f WB |
256 | sock.set_nodelay(true).unwrap(); |
257 | let _ = set_tcp_keepalive(sock.as_raw_fd(), PROXMOX_BACKUP_TCP_KEEPALIVE_TIME); | |
48aa2b93 | 258 | |
4ce7da51 DM |
259 | let ssl = { // limit acceptor_guard scope |
260 | // Acceptor can be reloaded using the command socket "reload-certificate" command | |
261 | let acceptor_guard = acceptor.lock().unwrap(); | |
262 | ||
263 | match openssl::ssl::Ssl::new(acceptor_guard.context()) { | |
264 | Ok(ssl) => ssl, | |
265 | Err(err) => { | |
266 | eprintln!("failed to create Ssl object from Acceptor context - {}", err); | |
267 | continue; | |
268 | }, | |
269 | } | |
cc269b9f | 270 | }; |
4ce7da51 | 271 | |
cc269b9f WB |
272 | let stream = match tokio_openssl::SslStream::new(ssl, sock) { |
273 | Ok(stream) => stream, | |
274 | Err(err) => { | |
275 | eprintln!("failed to create SslStream using ssl and connection socket - {}", err); | |
276 | continue; | |
277 | }, | |
278 | }; | |
279 | ||
280 | let mut stream = Box::pin(stream); | |
281 | let sender = sender.clone(); | |
282 | ||
283 | if Arc::strong_count(&accept_counter) > MAX_PENDING_ACCEPTS { | |
284 | eprintln!("connection rejected - to many open connections"); | |
285 | continue; | |
48aa2b93 | 286 | } |
cc269b9f | 287 | |
b4931192 | 288 | let accept_counter = Arc::clone(&accept_counter); |
cc269b9f WB |
289 | tokio::spawn(async move { |
290 | let accept_future = tokio::time::timeout( | |
291 | Duration::new(10, 0), stream.as_mut().accept()); | |
292 | ||
293 | let result = accept_future.await; | |
294 | ||
295 | match result { | |
296 | Ok(Ok(())) => { | |
297 | if sender.send(Ok(stream)).await.is_err() && debug { | |
298 | eprintln!("detect closed connection channel"); | |
299 | } | |
300 | } | |
301 | Ok(Err(err)) => { | |
302 | if debug { | |
303 | eprintln!("https handshake failed - {}", err); | |
304 | } | |
305 | } | |
306 | Err(_) => { | |
307 | if debug { | |
308 | eprintln!("https handshake timeout"); | |
309 | } | |
310 | } | |
311 | } | |
312 | ||
313 | drop(accept_counter); // decrease reference count | |
314 | }); | |
a5e3be49 | 315 | } |
48aa2b93 DM |
316 | } |
317 | ||
eaeda365 | 318 | fn start_stat_generator() { |
fd6d2438 | 319 | let abort_future = proxmox_rest_server::shutdown_future(); |
eaeda365 DM |
320 | let future = Box::pin(run_stat_generator()); |
321 | let task = futures::future::select(future, abort_future); | |
322 | tokio::spawn(task.map(|_| ())); | |
323 | } | |
324 | ||
8545480a | 325 | fn start_task_scheduler() { |
fd6d2438 | 326 | let abort_future = proxmox_rest_server::shutdown_future(); |
8545480a DM |
327 | let future = Box::pin(run_task_scheduler()); |
328 | let task = futures::future::select(future, abort_future); | |
329 | tokio::spawn(task.map(|_| ())); | |
330 | } | |
331 | ||
6a7be83e | 332 | use std::time::{SystemTime, Instant, Duration, UNIX_EPOCH}; |
8545480a DM |
333 | |
334 | fn next_minute() -> Result<Instant, Error> { | |
6a7be83e DM |
335 | let now = SystemTime::now(); |
336 | let epoch_now = now.duration_since(UNIX_EPOCH)?; | |
337 | let epoch_next = Duration::from_secs((epoch_now.as_secs()/60 + 1)*60); | |
8545480a DM |
338 | Ok(Instant::now() + epoch_next - epoch_now) |
339 | } | |
340 | ||
341 | async fn run_task_scheduler() { | |
342 | ||
343 | let mut count: usize = 0; | |
344 | ||
345 | loop { | |
346 | count += 1; | |
347 | ||
348 | let delay_target = match next_minute() { // try to run very minute | |
349 | Ok(d) => d, | |
350 | Err(err) => { | |
351 | eprintln!("task scheduler: compute next minute failed - {}", err); | |
0a8d773a | 352 | tokio::time::sleep_until(tokio::time::Instant::from_std(Instant::now() + Duration::from_secs(60))).await; |
8545480a DM |
353 | continue; |
354 | } | |
355 | }; | |
356 | ||
357 | if count > 2 { // wait 1..2 minutes before starting | |
358 | match schedule_tasks().catch_unwind().await { | |
359 | Err(panic) => { | |
360 | match panic.downcast::<&str>() { | |
361 | Ok(msg) => { | |
362 | eprintln!("task scheduler panic: {}", msg); | |
363 | } | |
364 | Err(_) => { | |
365 | eprintln!("task scheduler panic - unknown type"); | |
366 | } | |
367 | } | |
368 | } | |
369 | Ok(Err(err)) => { | |
370 | eprintln!("task scheduler failed - {:?}", err); | |
371 | } | |
372 | Ok(Ok(_)) => {} | |
373 | } | |
374 | } | |
375 | ||
0a8d773a | 376 | tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await; |
8545480a DM |
377 | } |
378 | } | |
379 | ||
380 | async fn schedule_tasks() -> Result<(), Error> { | |
381 | ||
382 | schedule_datastore_garbage_collection().await; | |
25829a87 | 383 | schedule_datastore_prune().await; |
a6160cdf | 384 | schedule_datastore_sync_jobs().await; |
73df9c51 | 385 | schedule_datastore_verify_jobs().await; |
8513626b | 386 | schedule_tape_backup_jobs().await; |
9a760917 | 387 | schedule_task_log_rotate().await; |
8545480a DM |
388 | |
389 | Ok(()) | |
390 | } | |
391 | ||
8545480a DM |
392 | async fn schedule_datastore_garbage_collection() { |
393 | ||
e7d4be9d | 394 | let config = match pbs_config::datastore::config() { |
8545480a DM |
395 | Err(err) => { |
396 | eprintln!("unable to read datastore config - {}", err); | |
397 | return; | |
398 | } | |
399 | Ok((config, _digest)) => config, | |
400 | }; | |
401 | ||
402 | for (store, (_, store_config)) in config.sections { | |
403 | let datastore = match DataStore::lookup_datastore(&store) { | |
404 | Ok(datastore) => datastore, | |
405 | Err(err) => { | |
406 | eprintln!("lookup_datastore failed - {}", err); | |
407 | continue; | |
408 | } | |
409 | }; | |
410 | ||
25829a87 | 411 | let store_config: DataStoreConfig = match serde_json::from_value(store_config) { |
8545480a DM |
412 | Ok(c) => c, |
413 | Err(err) => { | |
414 | eprintln!("datastore config from_value failed - {}", err); | |
415 | continue; | |
416 | } | |
417 | }; | |
418 | ||
419 | let event_str = match store_config.gc_schedule { | |
420 | Some(event_str) => event_str, | |
421 | None => continue, | |
422 | }; | |
423 | ||
424 | let event = match parse_calendar_event(&event_str) { | |
425 | Ok(event) => event, | |
426 | Err(err) => { | |
427 | eprintln!("unable to parse schedule '{}' - {}", event_str, err); | |
428 | continue; | |
429 | } | |
430 | }; | |
431 | ||
432 | if datastore.garbage_collection_running() { continue; } | |
433 | ||
434 | let worker_type = "garbage_collection"; | |
435 | ||
b6ba5acd DC |
436 | let last = match jobstate::last_run_time(worker_type, &store) { |
437 | Ok(time) => time, | |
438 | Err(err) => { | |
439 | eprintln!("could not get last run time of {} {}: {}", worker_type, store, err); | |
440 | continue; | |
8545480a DM |
441 | } |
442 | }; | |
443 | ||
444 | let next = match compute_next_event(&event, last, false) { | |
15ec790a DC |
445 | Ok(Some(next)) => next, |
446 | Ok(None) => continue, | |
8545480a DM |
447 | Err(err) => { |
448 | eprintln!("compute_next_event for '{}' failed - {}", event_str, err); | |
449 | continue; | |
450 | } | |
451 | }; | |
e693818a | 452 | |
6a7be83e DM |
453 | let now = proxmox::tools::time::epoch_i64(); |
454 | ||
8545480a DM |
455 | if next > now { continue; } |
456 | ||
1cd951c9 | 457 | let job = match Job::new(worker_type, &store) { |
d7a122a0 DC |
458 | Ok(job) => job, |
459 | Err(_) => continue, // could not get lock | |
460 | }; | |
461 | ||
ad54df31 | 462 | let auth_id = Authid::root_auth_id(); |
d7a122a0 | 463 | |
c724f658 | 464 | if let Err(err) = crate::server::do_garbage_collection_job(job, datastore, auth_id, Some(event_str), false) { |
3b707fbb | 465 | eprintln!("unable to start garbage collection job on datastore {} - {}", store, err); |
8545480a DM |
466 | } |
467 | } | |
468 | } | |
25829a87 DM |
469 | |
470 | async fn schedule_datastore_prune() { | |
471 | ||
e7d4be9d | 472 | let config = match pbs_config::datastore::config() { |
25829a87 DM |
473 | Err(err) => { |
474 | eprintln!("unable to read datastore config - {}", err); | |
475 | return; | |
476 | } | |
477 | Ok((config, _digest)) => config, | |
478 | }; | |
479 | ||
480 | for (store, (_, store_config)) in config.sections { | |
25829a87 DM |
481 | |
482 | let store_config: DataStoreConfig = match serde_json::from_value(store_config) { | |
483 | Ok(c) => c, | |
484 | Err(err) => { | |
a6160cdf | 485 | eprintln!("datastore '{}' config from_value failed - {}", store, err); |
25829a87 DM |
486 | continue; |
487 | } | |
488 | }; | |
489 | ||
490 | let event_str = match store_config.prune_schedule { | |
491 | Some(event_str) => event_str, | |
492 | None => continue, | |
493 | }; | |
494 | ||
495 | let prune_options = PruneOptions { | |
496 | keep_last: store_config.keep_last, | |
497 | keep_hourly: store_config.keep_hourly, | |
498 | keep_daily: store_config.keep_daily, | |
499 | keep_weekly: store_config.keep_weekly, | |
500 | keep_monthly: store_config.keep_monthly, | |
501 | keep_yearly: store_config.keep_yearly, | |
502 | }; | |
503 | ||
89725197 | 504 | if !pbs_datastore::prune::keeps_something(&prune_options) { // no prune settings - keep all |
25829a87 DM |
505 | continue; |
506 | } | |
507 | ||
25829a87 | 508 | let worker_type = "prune"; |
b15751bf | 509 | if check_schedule(worker_type, &event_str, &store) { |
82c05b41 HL |
510 | let job = match Job::new(worker_type, &store) { |
511 | Ok(job) => job, | |
512 | Err(_) => continue, // could not get lock | |
513 | }; | |
25829a87 | 514 | |
ad54df31 | 515 | let auth_id = Authid::root_auth_id().clone(); |
82c05b41 HL |
516 | if let Err(err) = do_prune_job(job, prune_options, store.clone(), &auth_id, Some(event_str)) { |
517 | eprintln!("unable to start datastore prune job {} - {}", &store, err); | |
25829a87 DM |
518 | } |
519 | }; | |
25829a87 DM |
520 | } |
521 | } | |
a6160cdf DM |
522 | |
523 | async fn schedule_datastore_sync_jobs() { | |
524 | ||
a6160cdf | 525 | |
a4e5a0fc | 526 | let config = match pbs_config::sync::config() { |
a6160cdf DM |
527 | Err(err) => { |
528 | eprintln!("unable to read sync job config - {}", err); | |
529 | return; | |
530 | } | |
531 | Ok((config, _digest)) => config, | |
532 | }; | |
533 | ||
a6160cdf DM |
534 | for (job_id, (_, job_config)) in config.sections { |
535 | let job_config: SyncJobConfig = match serde_json::from_value(job_config) { | |
536 | Ok(c) => c, | |
537 | Err(err) => { | |
538 | eprintln!("sync job config from_value failed - {}", err); | |
539 | continue; | |
540 | } | |
541 | }; | |
542 | ||
543 | let event_str = match job_config.schedule { | |
544 | Some(ref event_str) => event_str.clone(), | |
545 | None => continue, | |
546 | }; | |
547 | ||
c67b1fa7 | 548 | let worker_type = "syncjob"; |
b15751bf | 549 | if check_schedule(worker_type, &event_str, &job_id) { |
82c05b41 HL |
550 | let job = match Job::new(worker_type, &job_id) { |
551 | Ok(job) => job, | |
552 | Err(_) => continue, // could not get lock | |
553 | }; | |
a6160cdf | 554 | |
ad54df31 | 555 | let auth_id = Authid::root_auth_id().clone(); |
82c05b41 HL |
556 | if let Err(err) = do_sync_job(job, job_config, &auth_id, Some(event_str)) { |
557 | eprintln!("unable to start datastore sync job {} - {}", &job_id, err); | |
a6160cdf DM |
558 | } |
559 | }; | |
a6160cdf DM |
560 | } |
561 | } | |
eaeda365 | 562 | |
73df9c51 | 563 | async fn schedule_datastore_verify_jobs() { |
1298618a | 564 | |
802189f7 | 565 | let config = match pbs_config::verify::config() { |
73df9c51 HL |
566 | Err(err) => { |
567 | eprintln!("unable to read verification job config - {}", err); | |
568 | return; | |
569 | } | |
570 | Ok((config, _digest)) => config, | |
571 | }; | |
572 | for (job_id, (_, job_config)) in config.sections { | |
573 | let job_config: VerificationJobConfig = match serde_json::from_value(job_config) { | |
574 | Ok(c) => c, | |
575 | Err(err) => { | |
576 | eprintln!("verification job config from_value failed - {}", err); | |
577 | continue; | |
578 | } | |
579 | }; | |
580 | let event_str = match job_config.schedule { | |
581 | Some(ref event_str) => event_str.clone(), | |
582 | None => continue, | |
583 | }; | |
82c05b41 | 584 | |
73df9c51 | 585 | let worker_type = "verificationjob"; |
ad54df31 | 586 | let auth_id = Authid::root_auth_id().clone(); |
b15751bf | 587 | if check_schedule(worker_type, &event_str, &job_id) { |
82c05b41 HL |
588 | let job = match Job::new(&worker_type, &job_id) { |
589 | Ok(job) => job, | |
590 | Err(_) => continue, // could not get lock | |
591 | }; | |
592 | if let Err(err) = do_verification_job(job, job_config, &auth_id, Some(event_str)) { | |
593 | eprintln!("unable to start datastore verification job {} - {}", &job_id, err); | |
73df9c51 HL |
594 | } |
595 | }; | |
73df9c51 HL |
596 | } |
597 | } | |
598 | ||
8513626b DM |
599 | async fn schedule_tape_backup_jobs() { |
600 | ||
e3619d41 | 601 | let config = match pbs_config::tape_job::config() { |
8513626b DM |
602 | Err(err) => { |
603 | eprintln!("unable to read tape job config - {}", err); | |
604 | return; | |
605 | } | |
606 | Ok((config, _digest)) => config, | |
607 | }; | |
608 | for (job_id, (_, job_config)) in config.sections { | |
609 | let job_config: TapeBackupJobConfig = match serde_json::from_value(job_config) { | |
610 | Ok(c) => c, | |
611 | Err(err) => { | |
612 | eprintln!("tape backup job config from_value failed - {}", err); | |
613 | continue; | |
614 | } | |
615 | }; | |
616 | let event_str = match job_config.schedule { | |
617 | Some(ref event_str) => event_str.clone(), | |
618 | None => continue, | |
619 | }; | |
620 | ||
621 | let worker_type = "tape-backup-job"; | |
622 | let auth_id = Authid::root_auth_id().clone(); | |
623 | if check_schedule(worker_type, &event_str, &job_id) { | |
624 | let job = match Job::new(&worker_type, &job_id) { | |
625 | Ok(job) => job, | |
626 | Err(_) => continue, // could not get lock | |
627 | }; | |
5830e562 | 628 | if let Err(err) = do_tape_backup_job(job, job_config.setup, &auth_id, Some(event_str)) { |
7a61f89e | 629 | eprintln!("unable to start tape backup job {} - {}", &job_id, err); |
8513626b DM |
630 | } |
631 | }; | |
632 | } | |
633 | } | |
634 | ||
635 | ||
9a760917 | 636 | async fn schedule_task_log_rotate() { |
9a760917 DC |
637 | |
638 | let worker_type = "logrotate"; | |
72aa1834 | 639 | let job_id = "access-log_and_task-archive"; |
9a760917 | 640 | |
9a760917 DC |
641 | // schedule daily at 00:00 like normal logrotate |
642 | let schedule = "00:00"; | |
643 | ||
b15751bf | 644 | if !check_schedule(worker_type, schedule, job_id) { |
9a760917 DC |
645 | // if we never ran the rotation, schedule instantly |
646 | match jobstate::JobState::load(worker_type, job_id) { | |
647 | Ok(state) => match state { | |
648 | jobstate::JobState::Created { .. } => {}, | |
649 | _ => return, | |
650 | }, | |
651 | _ => return, | |
652 | } | |
653 | } | |
654 | ||
655 | let mut job = match Job::new(worker_type, job_id) { | |
656 | Ok(job) => job, | |
657 | Err(_) => return, // could not get lock | |
658 | }; | |
659 | ||
660 | if let Err(err) = WorkerTask::new_thread( | |
661 | worker_type, | |
72aa1834 | 662 | None, |
ad54df31 | 663 | Authid::root_auth_id().clone(), |
9a760917 DC |
664 | false, |
665 | move |worker| { | |
666 | job.start(&worker.upid().to_string())?; | |
3b82f3ee | 667 | worker.log("starting task log rotation".to_string()); |
e4f5f59e | 668 | |
9a760917 | 669 | let result = try_block!({ |
b7f2be51 TL |
670 | let max_size = 512 * 1024 - 1; // an entry has ~ 100b, so > 5000 entries/file |
671 | let max_files = 20; // times twenty files gives > 100000 task entries | |
9a760917 DC |
672 | let has_rotated = rotate_task_log_archive(max_size, true, Some(max_files))?; |
673 | if has_rotated { | |
3b82f3ee | 674 | worker.log("task log archive was rotated".to_string()); |
9a760917 | 675 | } else { |
3b82f3ee | 676 | worker.log("task log archive was not rotated".to_string()); |
9a760917 DC |
677 | } |
678 | ||
fe4cc5b1 TL |
679 | let max_size = 32 * 1024 * 1024 - 1; |
680 | let max_files = 14; | |
af06decd | 681 | let mut logrotate = LogRotate::new(pbs_buildcfg::API_ACCESS_LOG_FN, true) |
fe4cc5b1 TL |
682 | .ok_or_else(|| format_err!("could not get API access log file names"))?; |
683 | ||
fe7bdc9d | 684 | if logrotate.rotate(max_size, None, Some(max_files))? { |
fe4cc5b1 | 685 | println!("rotated access log, telling daemons to re-open log file"); |
d420962f | 686 | pbs_runtime::block_on(command_reopen_logfiles())?; |
3b82f3ee | 687 | worker.log("API access log was rotated".to_string()); |
fe7bdc9d | 688 | } else { |
3b82f3ee | 689 | worker.log("API access log was not rotated".to_string()); |
fe7bdc9d TL |
690 | } |
691 | ||
af06decd | 692 | let mut logrotate = LogRotate::new(pbs_buildcfg::API_AUTH_LOG_FN, true) |
fe7bdc9d | 693 | .ok_or_else(|| format_err!("could not get API auth log file names"))?; |
fe4cc5b1 | 694 | |
fe7bdc9d | 695 | if logrotate.rotate(max_size, None, Some(max_files))? { |
3b82f3ee | 696 | worker.log("API authentication log was rotated".to_string()); |
fe4cc5b1 | 697 | } else { |
3b82f3ee | 698 | worker.log("API authentication log was not rotated".to_string()); |
fe4cc5b1 TL |
699 | } |
700 | ||
9a760917 DC |
701 | Ok(()) |
702 | }); | |
703 | ||
704 | let status = worker.create_state(&result); | |
705 | ||
706 | if let Err(err) = job.finish(status) { | |
707 | eprintln!("could not finish job state for {}: {}", worker_type, err); | |
708 | } | |
709 | ||
710 | result | |
711 | }, | |
712 | ) { | |
713 | eprintln!("unable to start task log rotation: {}", err); | |
714 | } | |
715 | ||
716 | } | |
717 | ||
fe4cc5b1 TL |
718 | async fn command_reopen_logfiles() -> Result<(), Error> { |
719 | // only care about the most recent daemon instance for each, proxy & api, as other older ones | |
720 | // should not respond to new requests anyway, but only finish their current one and then exit. | |
fd6d2438 DM |
721 | let sock = crate::server::our_ctrl_sock(); |
722 | let f1 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n"); | |
fe4cc5b1 | 723 | |
fd6d2438 DM |
724 | let pid = crate::server::read_pid(pbs_buildcfg::PROXMOX_BACKUP_API_PID_FN)?; |
725 | let sock = crate::server::ctrl_sock_from_pid(pid); | |
726 | let f2 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n"); | |
546b6a23 TL |
727 | |
728 | match futures::join!(f1, f2) { | |
729 | (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)), | |
730 | (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)), | |
731 | (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)), | |
732 | _ => Ok(()), | |
733 | } | |
fe4cc5b1 TL |
734 | } |
735 | ||
eaeda365 DM |
736 | async fn run_stat_generator() { |
737 | ||
013fa7bb | 738 | let mut count = 0; |
eaeda365 | 739 | loop { |
013fa7bb | 740 | count += 1; |
a720894f | 741 | let save = if count >= 6 { count = 0; true } else { false }; |
013fa7bb | 742 | |
eaeda365 DM |
743 | let delay_target = Instant::now() + Duration::from_secs(10); |
744 | ||
013fa7bb | 745 | generate_host_stats(save).await; |
eaeda365 | 746 | |
0a8d773a | 747 | tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await; |
013fa7bb DM |
748 | |
749 | } | |
eaeda365 DM |
750 | |
751 | } | |
752 | ||
013fa7bb | 753 | fn rrd_update_gauge(name: &str, value: f64, save: bool) { |
309ef20d | 754 | use proxmox_backup::rrd; |
013fa7bb | 755 | if let Err(err) = rrd::update_value(name, value, rrd::DST::Gauge, save) { |
309ef20d DM |
756 | eprintln!("rrd::update_value '{}' failed - {}", name, err); |
757 | } | |
758 | } | |
759 | ||
013fa7bb | 760 | fn rrd_update_derive(name: &str, value: f64, save: bool) { |
309ef20d | 761 | use proxmox_backup::rrd; |
013fa7bb | 762 | if let Err(err) = rrd::update_value(name, value, rrd::DST::Derive, save) { |
309ef20d DM |
763 | eprintln!("rrd::update_value '{}' failed - {}", name, err); |
764 | } | |
765 | } | |
766 | ||
013fa7bb | 767 | async fn generate_host_stats(save: bool) { |
8f0cec26 | 768 | use proxmox::sys::linux::procfs::{ |
485841da | 769 | read_meminfo, read_proc_stat, read_proc_net_dev, read_loadavg}; |
eaeda365 | 770 | |
d420962f | 771 | pbs_runtime::block_in_place(move || { |
4f951399 DM |
772 | |
773 | match read_proc_stat() { | |
774 | Ok(stat) => { | |
013fa7bb DM |
775 | rrd_update_gauge("host/cpu", stat.cpu, save); |
776 | rrd_update_gauge("host/iowait", stat.iowait_percent, save); | |
4f951399 DM |
777 | } |
778 | Err(err) => { | |
779 | eprintln!("read_proc_stat failed - {}", err); | |
eaeda365 DM |
780 | } |
781 | } | |
2c66a590 | 782 | |
4f951399 DM |
783 | match read_meminfo() { |
784 | Ok(meminfo) => { | |
013fa7bb DM |
785 | rrd_update_gauge("host/memtotal", meminfo.memtotal as f64, save); |
786 | rrd_update_gauge("host/memused", meminfo.memused as f64, save); | |
787 | rrd_update_gauge("host/swaptotal", meminfo.swaptotal as f64, save); | |
788 | rrd_update_gauge("host/swapused", meminfo.swapused as f64, save); | |
a4a3f7ca | 789 | } |
4f951399 DM |
790 | Err(err) => { |
791 | eprintln!("read_meminfo failed - {}", err); | |
a4a3f7ca DM |
792 | } |
793 | } | |
8f0cec26 | 794 | |
4f951399 DM |
795 | match read_proc_net_dev() { |
796 | Ok(netdev) => { | |
6f422880 | 797 | use pbs_config::network::is_physical_nic; |
4f951399 DM |
798 | let mut netin = 0; |
799 | let mut netout = 0; | |
800 | for item in netdev { | |
801 | if !is_physical_nic(&item.device) { continue; } | |
802 | netin += item.receive; | |
803 | netout += item.send; | |
804 | } | |
013fa7bb DM |
805 | rrd_update_derive("host/netin", netin as f64, save); |
806 | rrd_update_derive("host/netout", netout as f64, save); | |
8f0cec26 | 807 | } |
4f951399 DM |
808 | Err(err) => { |
809 | eprintln!("read_prox_net_dev failed - {}", err); | |
8f0cec26 DM |
810 | } |
811 | } | |
dd15c0aa | 812 | |
485841da DM |
813 | match read_loadavg() { |
814 | Ok(loadavg) => { | |
013fa7bb | 815 | rrd_update_gauge("host/loadavg", loadavg.0 as f64, save); |
485841da DM |
816 | } |
817 | Err(err) => { | |
818 | eprintln!("read_loadavg failed - {}", err); | |
819 | } | |
820 | } | |
821 | ||
8c03041a DM |
822 | let disk_manager = DiskManage::new(); |
823 | ||
013fa7bb | 824 | gather_disk_stats(disk_manager.clone(), Path::new("/"), "host", save); |
91e5bb49 | 825 | |
e7d4be9d | 826 | match pbs_config::datastore::config() { |
d0833a70 | 827 | Ok((config, _)) => { |
e7d4be9d | 828 | let datastore_list: Vec<DataStoreConfig> = |
17c7b46a | 829 | config.convert_to_typed_array("datastore").unwrap_or_default(); |
d0833a70 DM |
830 | |
831 | for config in datastore_list { | |
8c03041a | 832 | |
91e5bb49 | 833 | let rrd_prefix = format!("datastore/{}", config.name); |
8c03041a | 834 | let path = std::path::Path::new(&config.path); |
013fa7bb | 835 | gather_disk_stats(disk_manager.clone(), path, &rrd_prefix, save); |
d0833a70 DM |
836 | } |
837 | } | |
838 | Err(err) => { | |
839 | eprintln!("read datastore config failed - {}", err); | |
840 | } | |
841 | } | |
842 | ||
4f951399 | 843 | }); |
eaeda365 | 844 | } |
dd15c0aa | 845 | |
b15751bf DM |
846 | fn check_schedule(worker_type: &str, event_str: &str, id: &str) -> bool { |
847 | let event = match parse_calendar_event(event_str) { | |
82c05b41 HL |
848 | Ok(event) => event, |
849 | Err(err) => { | |
850 | eprintln!("unable to parse schedule '{}' - {}", event_str, err); | |
851 | return false; | |
852 | } | |
853 | }; | |
854 | ||
b15751bf | 855 | let last = match jobstate::last_run_time(worker_type, &id) { |
82c05b41 HL |
856 | Ok(time) => time, |
857 | Err(err) => { | |
858 | eprintln!("could not get last run time of {} {}: {}", worker_type, id, err); | |
859 | return false; | |
860 | } | |
861 | }; | |
862 | ||
863 | let next = match compute_next_event(&event, last, false) { | |
864 | Ok(Some(next)) => next, | |
865 | Ok(None) => return false, | |
866 | Err(err) => { | |
867 | eprintln!("compute_next_event for '{}' failed - {}", event_str, err); | |
868 | return false; | |
869 | } | |
870 | }; | |
871 | ||
872 | let now = proxmox::tools::time::epoch_i64(); | |
873 | next <= now | |
874 | } | |
875 | ||
013fa7bb | 876 | fn gather_disk_stats(disk_manager: Arc<DiskManage>, path: &Path, rrd_prefix: &str, save: bool) { |
91e5bb49 | 877 | |
934f5bb8 | 878 | match proxmox_backup::tools::disks::disk_usage(path) { |
33070956 | 879 | Ok(status) => { |
91e5bb49 | 880 | let rrd_key = format!("{}/total", rrd_prefix); |
33070956 | 881 | rrd_update_gauge(&rrd_key, status.total as f64, save); |
91e5bb49 | 882 | let rrd_key = format!("{}/used", rrd_prefix); |
33070956 | 883 | rrd_update_gauge(&rrd_key, status.used as f64, save); |
91e5bb49 DM |
884 | } |
885 | Err(err) => { | |
886 | eprintln!("read disk_usage on {:?} failed - {}", path, err); | |
887 | } | |
888 | } | |
889 | ||
934f5bb8 DM |
890 | match disk_manager.find_mounted_device(path) { |
891 | Ok(None) => {}, | |
892 | Ok(Some((fs_type, device, source))) => { | |
893 | let mut device_stat = None; | |
894 | match fs_type.as_str() { | |
895 | "zfs" => { | |
368f4c54 DC |
896 | if let Some(source) = source { |
897 | let pool = get_pool_from_dataset(&source).unwrap_or(&source); | |
898 | match zfs_pool_stats(pool) { | |
934f5bb8 DM |
899 | Ok(stat) => device_stat = stat, |
900 | Err(err) => eprintln!("zfs_pool_stats({:?}) failed - {}", pool, err), | |
91e5bb49 DM |
901 | } |
902 | } | |
934f5bb8 DM |
903 | } |
904 | _ => { | |
905 | if let Ok(disk) = disk_manager.clone().disk_by_dev_num(device.into_dev_t()) { | |
906 | match disk.read_stat() { | |
907 | Ok(stat) => device_stat = stat, | |
908 | Err(err) => eprintln!("disk.read_stat {:?} failed - {}", path, err), | |
91e5bb49 DM |
909 | } |
910 | } | |
911 | } | |
91e5bb49 | 912 | } |
934f5bb8 DM |
913 | if let Some(stat) = device_stat { |
914 | let rrd_key = format!("{}/read_ios", rrd_prefix); | |
915 | rrd_update_derive(&rrd_key, stat.read_ios as f64, save); | |
916 | let rrd_key = format!("{}/read_bytes", rrd_prefix); | |
917 | rrd_update_derive(&rrd_key, (stat.read_sectors*512) as f64, save); | |
dd15c0aa | 918 | |
934f5bb8 DM |
919 | let rrd_key = format!("{}/write_ios", rrd_prefix); |
920 | rrd_update_derive(&rrd_key, stat.write_ios as f64, save); | |
921 | let rrd_key = format!("{}/write_bytes", rrd_prefix); | |
922 | rrd_update_derive(&rrd_key, (stat.write_sectors*512) as f64, save); | |
dd15c0aa | 923 | |
934f5bb8 DM |
924 | let rrd_key = format!("{}/io_ticks", rrd_prefix); |
925 | rrd_update_derive(&rrd_key, (stat.io_ticks as f64)/1000.0, save); | |
8c03041a DM |
926 | } |
927 | } | |
934f5bb8 DM |
928 | Err(err) => { |
929 | eprintln!("find_mounted_device failed - {}", err); | |
930 | } | |
8c03041a | 931 | } |
8c03041a | 932 | } |