]> git.proxmox.com Git - proxmox-backup.git/blame - src/bin/proxmox-backup-proxy.rs
move ApiConfig, FileLogger and CommandoSocket to proxmox-rest-server workspace
[proxmox-backup.git] / src / bin / proxmox-backup-proxy.rs
CommitLineData
4ce7da51 1use std::sync::{Mutex, Arc};
2ab5acac 2use std::path::{Path, PathBuf};
97168f92 3use std::os::unix::io::AsRawFd;
a2479cfa 4
f7d4e4b5 5use anyhow::{bail, format_err, Error};
a2479cfa 6use futures::*;
ea368a06 7
a2479cfa 8use openssl::ssl::{SslMethod, SslAcceptor, SslFiletype};
7c667013 9use tokio_stream::wrappers::ReceiverStream;
a723c087 10use serde_json::Value;
a2479cfa 11
9ea4bce4 12use proxmox::try_block;
a2479cfa 13use proxmox::api::RpcEnvironmentType;
32413921 14use proxmox::sys::linux::socket::set_tcp_keepalive;
fd6d2438
DM
15use proxmox::tools::fs::CreateOptions;
16
17use proxmox_rest_server::ApiConfig;
a2479cfa 18
1298618a
DM
19use proxmox_backup::{
20 backup::DataStore,
21 server::{
26858dba 22 auth::default_api_auth,
1298618a 23 WorkerTask,
1298618a
DM
24 rest::*,
25 jobstate::{
26 self,
27 Job,
28 },
29 rotate_task_log_archive,
30 },
1298618a
DM
31};
32
af06decd 33use pbs_buildcfg::configdir;
dd2162f6 34use pbs_systemd::time::{compute_next_event, parse_calendar_event};
6c76aa43 35use pbs_tools::logrotate::LogRotate;
1298618a 36
89725197
DM
37use pbs_api_types::{
38 Authid, TapeBackupJobConfig, VerificationJobConfig, SyncJobConfig, DataStoreConfig,
39 PruneOptions,
40};
e7d4be9d 41
e3f41f21 42use proxmox_backup::server;
d01e2420 43use proxmox_backup::auth_helpers::*;
97168f92 44use proxmox_backup::tools::{
32413921 45 PROXMOX_BACKUP_TCP_KEEPALIVE_TIME,
e4f5f59e 46 daemon,
97168f92
DM
47 disks::{
48 DiskManage,
49 zfs_pool_stats,
368f4c54 50 get_pool_from_dataset,
97168f92 51 },
97168f92 52};
02c7a755 53
e7d4be9d 54
a13573c2 55use proxmox_backup::api2::pull::do_sync_job;
8513626b 56use proxmox_backup::api2::tape::backup::do_tape_backup_job;
1298618a 57use proxmox_backup::server::do_verification_job;
b8d90798 58use proxmox_backup::server::do_prune_job;
a13573c2 59
946c3e8a 60fn main() -> Result<(), Error> {
ac7513e3
DM
61 proxmox_backup::tools::setup_safe_path_env();
62
21211748
DM
63 let backup_uid = pbs_config::backup_user()?.uid;
64 let backup_gid = pbs_config::backup_group()?.gid;
843880f0
TL
65 let running_uid = nix::unistd::Uid::effective();
66 let running_gid = nix::unistd::Gid::effective();
67
68 if running_uid != backup_uid || running_gid != backup_gid {
69 bail!("proxy not running as backup user or group (got uid {} gid {})", running_uid, running_gid);
70 }
71
d420962f 72 pbs_runtime::main(run())
4223d9f8
DM
73}
74
fda5797b 75async fn run() -> Result<(), Error> {
02c7a755
DM
76 if let Err(err) = syslog::init(
77 syslog::Facility::LOG_DAEMON,
78 log::LevelFilter::Info,
79 Some("proxmox-backup-proxy")) {
4223d9f8 80 bail!("unable to inititialize syslog - {}", err);
02c7a755
DM
81 }
82
e1d367df
DM
83 // Note: To debug early connection error use
84 // PROXMOX_DEBUG=1 ./target/release/proxmox-backup-proxy
85 let debug = std::env::var("PROXMOX_DEBUG").is_ok();
86
d01e2420
DM
87 let _ = public_auth_key(); // load with lazy_static
88 let _ = csrf_secret(); // load with lazy_static
89
02c7a755 90 let mut config = ApiConfig::new(
af06decd 91 pbs_buildcfg::JS_DIR,
26858dba
SR
92 &proxmox_backup::api2::ROUTER,
93 RpcEnvironmentType::PUBLIC,
94 default_api_auth(),
95 )?;
02c7a755 96
02c7a755
DM
97 config.add_alias("novnc", "/usr/share/novnc-pve");
98 config.add_alias("extjs", "/usr/share/javascript/extjs");
7f066a9b 99 config.add_alias("qrcodejs", "/usr/share/javascript/qrcodejs");
02c7a755
DM
100 config.add_alias("fontawesome", "/usr/share/fonts-font-awesome");
101 config.add_alias("xtermjs", "/usr/share/pve-xtermjs");
abd4c4cb 102 config.add_alias("locale", "/usr/share/pbs-i18n");
02c7a755 103 config.add_alias("widgettoolkit", "/usr/share/javascript/proxmox-widget-toolkit");
9c01e73c 104 config.add_alias("docs", "/usr/share/doc/proxmox-backup/html");
02c7a755 105
af06decd 106 let mut indexpath = PathBuf::from(pbs_buildcfg::JS_DIR);
2ab5acac
DC
107 indexpath.push("index.hbs");
108 config.register_template("index", &indexpath)?;
01ca99da 109 config.register_template("console", "/usr/share/pve-xtermjs/index.html.hbs")?;
2ab5acac 110
fd6d2438
DM
111 let backup_user = pbs_config::backup_user()?;
112 let mut commando_sock = proxmox_rest_server::CommandoSocket::new(crate::server::our_ctrl_sock(), backup_user.gid);
113
114 let dir_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid);
115 let file_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid);
a68768cf 116
fd6d2438
DM
117 config.enable_file_log(
118 pbs_buildcfg::API_ACCESS_LOG_FN,
119 Some(dir_opts),
120 Some(file_opts),
121 &mut commando_sock,
122 )?;
8e7e2223 123
02c7a755
DM
124 let rest_server = RestServer::new(config);
125
6d1f61b2 126 //openssl req -x509 -newkey rsa:4096 -keyout /etc/proxmox-backup/proxy.key -out /etc/proxmox-backup/proxy.pem -nodes
6d1f61b2 127
4ce7da51 128 // we build the initial acceptor here as we cannot start if this fails
c381a162 129 let acceptor = make_tls_acceptor()?;
4ce7da51 130 let acceptor = Arc::new(Mutex::new(acceptor));
6d1f61b2 131
4ce7da51 132 // to renew the acceptor we just add a command-socket handler
a723c087
WB
133 commando_sock.register_command(
134 "reload-certificate".to_string(),
135 {
4ce7da51 136 let acceptor = Arc::clone(&acceptor);
a723c087 137 move |_value| -> Result<_, Error> {
4ce7da51
DM
138 log::info!("reloading certificate");
139 match make_tls_acceptor() {
140 Err(err) => log::error!("error reloading certificate: {}", err),
141 Ok(new_acceptor) => {
142 let mut guard = acceptor.lock().unwrap();
143 *guard = new_acceptor;
144 }
145 }
a723c087
WB
146 Ok(Value::Null)
147 }
148 },
149 )?;
0d176f36 150
062cf75c
DC
151 // to remove references for not configured datastores
152 commando_sock.register_command(
153 "datastore-removed".to_string(),
154 |_value| {
155 if let Err(err) = proxmox_backup::backup::DataStore::remove_unused_datastores() {
156 log::error!("could not refresh datastores: {}", err);
157 }
158 Ok(Value::Null)
159 }
160 )?;
161
a690ecac
WB
162 let server = daemon::create_daemon(
163 ([0,0,0,0,0,0,0,0], 8007).into(),
a723c087 164 move |listener, ready| {
97168f92 165
4ce7da51 166 let connections = accept_connections(listener, acceptor, debug);
7c667013 167 let connections = hyper::server::accept::from_stream(ReceiverStream::new(connections));
083ff3fd
WB
168
169 Ok(ready
48aa2b93 170 .and_then(|_| hyper::Server::builder(connections)
083ff3fd 171 .serve(rest_server)
fd6d2438 172 .with_graceful_shutdown(proxmox_rest_server::shutdown_future())
083ff3fd
WB
173 .map_err(Error::from)
174 )
175 .map_err(|err| eprintln!("server error: {}", err))
176 .map(|_| ())
a690ecac 177 )
a2ca7137 178 },
d7c6ad60 179 "proxmox-backup-proxy.service",
083ff3fd 180 );
a2ca7137 181
af06decd 182 server::write_pid(pbs_buildcfg::PROXMOX_BACKUP_PROXY_PID_FN)?;
d98c9a7a
WB
183 daemon::systemd_notify(daemon::SystemdNotify::Ready)?;
184
fda5797b 185 let init_result: Result<(), Error> = try_block!({
a68768cf
TL
186 server::register_task_control_commands(&mut commando_sock)?;
187 commando_sock.spawn()?;
fd6d2438 188 proxmox_rest_server::server_state_init()?;
fda5797b
WB
189 Ok(())
190 });
d607b886 191
fda5797b
WB
192 if let Err(err) = init_result {
193 bail!("unable to start daemon - {}", err);
194 }
e3f41f21 195
8545480a 196 start_task_scheduler();
eaeda365 197 start_stat_generator();
8545480a 198
083ff3fd 199 server.await?;
a546a8a0 200 log::info!("server shutting down, waiting for active workers to complete");
fd6d2438 201 proxmox_rest_server::last_worker_future().await?;
fda5797b 202 log::info!("done - exit server");
e3f41f21 203
4223d9f8 204 Ok(())
02c7a755 205}
8545480a 206
4ce7da51 207fn make_tls_acceptor() -> Result<SslAcceptor, Error> {
c381a162
WB
208 let key_path = configdir!("/proxy.key");
209 let cert_path = configdir!("/proxy.pem");
210
211 let mut acceptor = SslAcceptor::mozilla_intermediate_v5(SslMethod::tls()).unwrap();
212 acceptor.set_private_key_file(key_path, SslFiletype::PEM)
213 .map_err(|err| format_err!("unable to read proxy key {} - {}", key_path, err))?;
214 acceptor.set_certificate_chain_file(cert_path)
215 .map_err(|err| format_err!("unable to read proxy cert {} - {}", cert_path, err))?;
216 acceptor.check_private_key().unwrap();
217
4ce7da51 218 Ok(acceptor.build())
c381a162
WB
219}
220
a5e3be49
WB
221type ClientStreamResult =
222 Result<std::pin::Pin<Box<tokio_openssl::SslStream<tokio::net::TcpStream>>>, Error>;
223const MAX_PENDING_ACCEPTS: usize = 1024;
224
48aa2b93 225fn accept_connections(
0bfcea6a 226 listener: tokio::net::TcpListener,
4ce7da51 227 acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>,
e1d367df 228 debug: bool,
a5e3be49 229) -> tokio::sync::mpsc::Receiver<ClientStreamResult> {
48aa2b93 230
ea93bea7 231 let (sender, receiver) = tokio::sync::mpsc::channel(MAX_PENDING_ACCEPTS);
48aa2b93 232
4ce7da51 233 tokio::spawn(accept_connection(listener, acceptor, debug, sender));
a5e3be49
WB
234
235 receiver
236}
237
238async fn accept_connection(
239 listener: tokio::net::TcpListener,
4ce7da51 240 acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>,
a5e3be49
WB
241 debug: bool,
242 sender: tokio::sync::mpsc::Sender<ClientStreamResult>,
243) {
ea93bea7 244 let accept_counter = Arc::new(());
48aa2b93 245
a5e3be49 246 loop {
4ce7da51
DM
247 let (sock, _addr) = match listener.accept().await {
248 Ok(conn) => conn,
249 Err(err) => {
250 eprintln!("error accepting tcp connection: {}", err);
cc269b9f 251 continue;
a5e3be49 252 }
cc269b9f 253 };
48aa2b93 254
cc269b9f
WB
255 sock.set_nodelay(true).unwrap();
256 let _ = set_tcp_keepalive(sock.as_raw_fd(), PROXMOX_BACKUP_TCP_KEEPALIVE_TIME);
48aa2b93 257
4ce7da51
DM
258 let ssl = { // limit acceptor_guard scope
259 // Acceptor can be reloaded using the command socket "reload-certificate" command
260 let acceptor_guard = acceptor.lock().unwrap();
261
262 match openssl::ssl::Ssl::new(acceptor_guard.context()) {
263 Ok(ssl) => ssl,
264 Err(err) => {
265 eprintln!("failed to create Ssl object from Acceptor context - {}", err);
266 continue;
267 },
268 }
cc269b9f 269 };
4ce7da51 270
cc269b9f
WB
271 let stream = match tokio_openssl::SslStream::new(ssl, sock) {
272 Ok(stream) => stream,
273 Err(err) => {
274 eprintln!("failed to create SslStream using ssl and connection socket - {}", err);
275 continue;
276 },
277 };
278
279 let mut stream = Box::pin(stream);
280 let sender = sender.clone();
281
282 if Arc::strong_count(&accept_counter) > MAX_PENDING_ACCEPTS {
283 eprintln!("connection rejected - to many open connections");
284 continue;
48aa2b93 285 }
cc269b9f 286
b4931192 287 let accept_counter = Arc::clone(&accept_counter);
cc269b9f
WB
288 tokio::spawn(async move {
289 let accept_future = tokio::time::timeout(
290 Duration::new(10, 0), stream.as_mut().accept());
291
292 let result = accept_future.await;
293
294 match result {
295 Ok(Ok(())) => {
296 if sender.send(Ok(stream)).await.is_err() && debug {
297 eprintln!("detect closed connection channel");
298 }
299 }
300 Ok(Err(err)) => {
301 if debug {
302 eprintln!("https handshake failed - {}", err);
303 }
304 }
305 Err(_) => {
306 if debug {
307 eprintln!("https handshake timeout");
308 }
309 }
310 }
311
312 drop(accept_counter); // decrease reference count
313 });
a5e3be49 314 }
48aa2b93
DM
315}
316
eaeda365 317fn start_stat_generator() {
fd6d2438 318 let abort_future = proxmox_rest_server::shutdown_future();
eaeda365
DM
319 let future = Box::pin(run_stat_generator());
320 let task = futures::future::select(future, abort_future);
321 tokio::spawn(task.map(|_| ()));
322}
323
8545480a 324fn start_task_scheduler() {
fd6d2438 325 let abort_future = proxmox_rest_server::shutdown_future();
8545480a
DM
326 let future = Box::pin(run_task_scheduler());
327 let task = futures::future::select(future, abort_future);
328 tokio::spawn(task.map(|_| ()));
329}
330
6a7be83e 331use std::time::{SystemTime, Instant, Duration, UNIX_EPOCH};
8545480a
DM
332
333fn next_minute() -> Result<Instant, Error> {
6a7be83e
DM
334 let now = SystemTime::now();
335 let epoch_now = now.duration_since(UNIX_EPOCH)?;
336 let epoch_next = Duration::from_secs((epoch_now.as_secs()/60 + 1)*60);
8545480a
DM
337 Ok(Instant::now() + epoch_next - epoch_now)
338}
339
340async fn run_task_scheduler() {
341
342 let mut count: usize = 0;
343
344 loop {
345 count += 1;
346
347 let delay_target = match next_minute() { // try to run very minute
348 Ok(d) => d,
349 Err(err) => {
350 eprintln!("task scheduler: compute next minute failed - {}", err);
0a8d773a 351 tokio::time::sleep_until(tokio::time::Instant::from_std(Instant::now() + Duration::from_secs(60))).await;
8545480a
DM
352 continue;
353 }
354 };
355
356 if count > 2 { // wait 1..2 minutes before starting
357 match schedule_tasks().catch_unwind().await {
358 Err(panic) => {
359 match panic.downcast::<&str>() {
360 Ok(msg) => {
361 eprintln!("task scheduler panic: {}", msg);
362 }
363 Err(_) => {
364 eprintln!("task scheduler panic - unknown type");
365 }
366 }
367 }
368 Ok(Err(err)) => {
369 eprintln!("task scheduler failed - {:?}", err);
370 }
371 Ok(Ok(_)) => {}
372 }
373 }
374
0a8d773a 375 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
8545480a
DM
376 }
377}
378
379async fn schedule_tasks() -> Result<(), Error> {
380
381 schedule_datastore_garbage_collection().await;
25829a87 382 schedule_datastore_prune().await;
a6160cdf 383 schedule_datastore_sync_jobs().await;
73df9c51 384 schedule_datastore_verify_jobs().await;
8513626b 385 schedule_tape_backup_jobs().await;
9a760917 386 schedule_task_log_rotate().await;
8545480a
DM
387
388 Ok(())
389}
390
8545480a
DM
391async fn schedule_datastore_garbage_collection() {
392
e7d4be9d 393 let config = match pbs_config::datastore::config() {
8545480a
DM
394 Err(err) => {
395 eprintln!("unable to read datastore config - {}", err);
396 return;
397 }
398 Ok((config, _digest)) => config,
399 };
400
401 for (store, (_, store_config)) in config.sections {
402 let datastore = match DataStore::lookup_datastore(&store) {
403 Ok(datastore) => datastore,
404 Err(err) => {
405 eprintln!("lookup_datastore failed - {}", err);
406 continue;
407 }
408 };
409
25829a87 410 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
8545480a
DM
411 Ok(c) => c,
412 Err(err) => {
413 eprintln!("datastore config from_value failed - {}", err);
414 continue;
415 }
416 };
417
418 let event_str = match store_config.gc_schedule {
419 Some(event_str) => event_str,
420 None => continue,
421 };
422
423 let event = match parse_calendar_event(&event_str) {
424 Ok(event) => event,
425 Err(err) => {
426 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
427 continue;
428 }
429 };
430
431 if datastore.garbage_collection_running() { continue; }
432
433 let worker_type = "garbage_collection";
434
b6ba5acd
DC
435 let last = match jobstate::last_run_time(worker_type, &store) {
436 Ok(time) => time,
437 Err(err) => {
438 eprintln!("could not get last run time of {} {}: {}", worker_type, store, err);
439 continue;
8545480a
DM
440 }
441 };
442
443 let next = match compute_next_event(&event, last, false) {
15ec790a
DC
444 Ok(Some(next)) => next,
445 Ok(None) => continue,
8545480a
DM
446 Err(err) => {
447 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
448 continue;
449 }
450 };
e693818a 451
6a7be83e
DM
452 let now = proxmox::tools::time::epoch_i64();
453
8545480a
DM
454 if next > now { continue; }
455
1cd951c9 456 let job = match Job::new(worker_type, &store) {
d7a122a0
DC
457 Ok(job) => job,
458 Err(_) => continue, // could not get lock
459 };
460
ad54df31 461 let auth_id = Authid::root_auth_id();
d7a122a0 462
c724f658 463 if let Err(err) = crate::server::do_garbage_collection_job(job, datastore, auth_id, Some(event_str), false) {
3b707fbb 464 eprintln!("unable to start garbage collection job on datastore {} - {}", store, err);
8545480a
DM
465 }
466 }
467}
25829a87
DM
468
469async fn schedule_datastore_prune() {
470
e7d4be9d 471 let config = match pbs_config::datastore::config() {
25829a87
DM
472 Err(err) => {
473 eprintln!("unable to read datastore config - {}", err);
474 return;
475 }
476 Ok((config, _digest)) => config,
477 };
478
479 for (store, (_, store_config)) in config.sections {
25829a87
DM
480
481 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
482 Ok(c) => c,
483 Err(err) => {
a6160cdf 484 eprintln!("datastore '{}' config from_value failed - {}", store, err);
25829a87
DM
485 continue;
486 }
487 };
488
489 let event_str = match store_config.prune_schedule {
490 Some(event_str) => event_str,
491 None => continue,
492 };
493
494 let prune_options = PruneOptions {
495 keep_last: store_config.keep_last,
496 keep_hourly: store_config.keep_hourly,
497 keep_daily: store_config.keep_daily,
498 keep_weekly: store_config.keep_weekly,
499 keep_monthly: store_config.keep_monthly,
500 keep_yearly: store_config.keep_yearly,
501 };
502
89725197 503 if !pbs_datastore::prune::keeps_something(&prune_options) { // no prune settings - keep all
25829a87
DM
504 continue;
505 }
506
25829a87 507 let worker_type = "prune";
b15751bf 508 if check_schedule(worker_type, &event_str, &store) {
82c05b41
HL
509 let job = match Job::new(worker_type, &store) {
510 Ok(job) => job,
511 Err(_) => continue, // could not get lock
512 };
25829a87 513
ad54df31 514 let auth_id = Authid::root_auth_id().clone();
82c05b41
HL
515 if let Err(err) = do_prune_job(job, prune_options, store.clone(), &auth_id, Some(event_str)) {
516 eprintln!("unable to start datastore prune job {} - {}", &store, err);
25829a87
DM
517 }
518 };
25829a87
DM
519 }
520}
a6160cdf
DM
521
522async fn schedule_datastore_sync_jobs() {
523
a6160cdf 524
a4e5a0fc 525 let config = match pbs_config::sync::config() {
a6160cdf
DM
526 Err(err) => {
527 eprintln!("unable to read sync job config - {}", err);
528 return;
529 }
530 Ok((config, _digest)) => config,
531 };
532
a6160cdf
DM
533 for (job_id, (_, job_config)) in config.sections {
534 let job_config: SyncJobConfig = match serde_json::from_value(job_config) {
535 Ok(c) => c,
536 Err(err) => {
537 eprintln!("sync job config from_value failed - {}", err);
538 continue;
539 }
540 };
541
542 let event_str = match job_config.schedule {
543 Some(ref event_str) => event_str.clone(),
544 None => continue,
545 };
546
c67b1fa7 547 let worker_type = "syncjob";
b15751bf 548 if check_schedule(worker_type, &event_str, &job_id) {
82c05b41
HL
549 let job = match Job::new(worker_type, &job_id) {
550 Ok(job) => job,
551 Err(_) => continue, // could not get lock
552 };
a6160cdf 553
ad54df31 554 let auth_id = Authid::root_auth_id().clone();
82c05b41
HL
555 if let Err(err) = do_sync_job(job, job_config, &auth_id, Some(event_str)) {
556 eprintln!("unable to start datastore sync job {} - {}", &job_id, err);
a6160cdf
DM
557 }
558 };
a6160cdf
DM
559 }
560}
eaeda365 561
73df9c51 562async fn schedule_datastore_verify_jobs() {
1298618a 563
802189f7 564 let config = match pbs_config::verify::config() {
73df9c51
HL
565 Err(err) => {
566 eprintln!("unable to read verification job config - {}", err);
567 return;
568 }
569 Ok((config, _digest)) => config,
570 };
571 for (job_id, (_, job_config)) in config.sections {
572 let job_config: VerificationJobConfig = match serde_json::from_value(job_config) {
573 Ok(c) => c,
574 Err(err) => {
575 eprintln!("verification job config from_value failed - {}", err);
576 continue;
577 }
578 };
579 let event_str = match job_config.schedule {
580 Some(ref event_str) => event_str.clone(),
581 None => continue,
582 };
82c05b41 583
73df9c51 584 let worker_type = "verificationjob";
ad54df31 585 let auth_id = Authid::root_auth_id().clone();
b15751bf 586 if check_schedule(worker_type, &event_str, &job_id) {
82c05b41
HL
587 let job = match Job::new(&worker_type, &job_id) {
588 Ok(job) => job,
589 Err(_) => continue, // could not get lock
590 };
591 if let Err(err) = do_verification_job(job, job_config, &auth_id, Some(event_str)) {
592 eprintln!("unable to start datastore verification job {} - {}", &job_id, err);
73df9c51
HL
593 }
594 };
73df9c51
HL
595 }
596}
597
8513626b
DM
598async fn schedule_tape_backup_jobs() {
599
e3619d41 600 let config = match pbs_config::tape_job::config() {
8513626b
DM
601 Err(err) => {
602 eprintln!("unable to read tape job config - {}", err);
603 return;
604 }
605 Ok((config, _digest)) => config,
606 };
607 for (job_id, (_, job_config)) in config.sections {
608 let job_config: TapeBackupJobConfig = match serde_json::from_value(job_config) {
609 Ok(c) => c,
610 Err(err) => {
611 eprintln!("tape backup job config from_value failed - {}", err);
612 continue;
613 }
614 };
615 let event_str = match job_config.schedule {
616 Some(ref event_str) => event_str.clone(),
617 None => continue,
618 };
619
620 let worker_type = "tape-backup-job";
621 let auth_id = Authid::root_auth_id().clone();
622 if check_schedule(worker_type, &event_str, &job_id) {
623 let job = match Job::new(&worker_type, &job_id) {
624 Ok(job) => job,
625 Err(_) => continue, // could not get lock
626 };
5830e562 627 if let Err(err) = do_tape_backup_job(job, job_config.setup, &auth_id, Some(event_str)) {
7a61f89e 628 eprintln!("unable to start tape backup job {} - {}", &job_id, err);
8513626b
DM
629 }
630 };
631 }
632}
633
634
9a760917 635async fn schedule_task_log_rotate() {
9a760917
DC
636
637 let worker_type = "logrotate";
72aa1834 638 let job_id = "access-log_and_task-archive";
9a760917 639
9a760917
DC
640 // schedule daily at 00:00 like normal logrotate
641 let schedule = "00:00";
642
b15751bf 643 if !check_schedule(worker_type, schedule, job_id) {
9a760917
DC
644 // if we never ran the rotation, schedule instantly
645 match jobstate::JobState::load(worker_type, job_id) {
646 Ok(state) => match state {
647 jobstate::JobState::Created { .. } => {},
648 _ => return,
649 },
650 _ => return,
651 }
652 }
653
654 let mut job = match Job::new(worker_type, job_id) {
655 Ok(job) => job,
656 Err(_) => return, // could not get lock
657 };
658
659 if let Err(err) = WorkerTask::new_thread(
660 worker_type,
72aa1834 661 None,
ad54df31 662 Authid::root_auth_id().clone(),
9a760917
DC
663 false,
664 move |worker| {
665 job.start(&worker.upid().to_string())?;
3b82f3ee 666 worker.log("starting task log rotation".to_string());
e4f5f59e 667
9a760917 668 let result = try_block!({
b7f2be51
TL
669 let max_size = 512 * 1024 - 1; // an entry has ~ 100b, so > 5000 entries/file
670 let max_files = 20; // times twenty files gives > 100000 task entries
9a760917
DC
671 let has_rotated = rotate_task_log_archive(max_size, true, Some(max_files))?;
672 if has_rotated {
3b82f3ee 673 worker.log("task log archive was rotated".to_string());
9a760917 674 } else {
3b82f3ee 675 worker.log("task log archive was not rotated".to_string());
9a760917
DC
676 }
677
fe4cc5b1
TL
678 let max_size = 32 * 1024 * 1024 - 1;
679 let max_files = 14;
af06decd 680 let mut logrotate = LogRotate::new(pbs_buildcfg::API_ACCESS_LOG_FN, true)
fe4cc5b1
TL
681 .ok_or_else(|| format_err!("could not get API access log file names"))?;
682
fe7bdc9d 683 if logrotate.rotate(max_size, None, Some(max_files))? {
fe4cc5b1 684 println!("rotated access log, telling daemons to re-open log file");
d420962f 685 pbs_runtime::block_on(command_reopen_logfiles())?;
3b82f3ee 686 worker.log("API access log was rotated".to_string());
fe7bdc9d 687 } else {
3b82f3ee 688 worker.log("API access log was not rotated".to_string());
fe7bdc9d
TL
689 }
690
af06decd 691 let mut logrotate = LogRotate::new(pbs_buildcfg::API_AUTH_LOG_FN, true)
fe7bdc9d 692 .ok_or_else(|| format_err!("could not get API auth log file names"))?;
fe4cc5b1 693
fe7bdc9d 694 if logrotate.rotate(max_size, None, Some(max_files))? {
3b82f3ee 695 worker.log("API authentication log was rotated".to_string());
fe4cc5b1 696 } else {
3b82f3ee 697 worker.log("API authentication log was not rotated".to_string());
fe4cc5b1
TL
698 }
699
9a760917
DC
700 Ok(())
701 });
702
703 let status = worker.create_state(&result);
704
705 if let Err(err) = job.finish(status) {
706 eprintln!("could not finish job state for {}: {}", worker_type, err);
707 }
708
709 result
710 },
711 ) {
712 eprintln!("unable to start task log rotation: {}", err);
713 }
714
715}
716
fe4cc5b1
TL
717async fn command_reopen_logfiles() -> Result<(), Error> {
718 // only care about the most recent daemon instance for each, proxy & api, as other older ones
719 // should not respond to new requests anyway, but only finish their current one and then exit.
fd6d2438
DM
720 let sock = crate::server::our_ctrl_sock();
721 let f1 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
fe4cc5b1 722
fd6d2438
DM
723 let pid = crate::server::read_pid(pbs_buildcfg::PROXMOX_BACKUP_API_PID_FN)?;
724 let sock = crate::server::ctrl_sock_from_pid(pid);
725 let f2 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
546b6a23
TL
726
727 match futures::join!(f1, f2) {
728 (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)),
729 (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)),
730 (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)),
731 _ => Ok(()),
732 }
fe4cc5b1
TL
733}
734
eaeda365
DM
735async fn run_stat_generator() {
736
013fa7bb 737 let mut count = 0;
eaeda365 738 loop {
013fa7bb 739 count += 1;
a720894f 740 let save = if count >= 6 { count = 0; true } else { false };
013fa7bb 741
eaeda365
DM
742 let delay_target = Instant::now() + Duration::from_secs(10);
743
013fa7bb 744 generate_host_stats(save).await;
eaeda365 745
0a8d773a 746 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
013fa7bb
DM
747
748 }
eaeda365
DM
749
750}
751
013fa7bb 752fn rrd_update_gauge(name: &str, value: f64, save: bool) {
309ef20d 753 use proxmox_backup::rrd;
013fa7bb 754 if let Err(err) = rrd::update_value(name, value, rrd::DST::Gauge, save) {
309ef20d
DM
755 eprintln!("rrd::update_value '{}' failed - {}", name, err);
756 }
757}
758
013fa7bb 759fn rrd_update_derive(name: &str, value: f64, save: bool) {
309ef20d 760 use proxmox_backup::rrd;
013fa7bb 761 if let Err(err) = rrd::update_value(name, value, rrd::DST::Derive, save) {
309ef20d
DM
762 eprintln!("rrd::update_value '{}' failed - {}", name, err);
763 }
764}
765
013fa7bb 766async fn generate_host_stats(save: bool) {
8f0cec26 767 use proxmox::sys::linux::procfs::{
485841da 768 read_meminfo, read_proc_stat, read_proc_net_dev, read_loadavg};
eaeda365 769
d420962f 770 pbs_runtime::block_in_place(move || {
4f951399
DM
771
772 match read_proc_stat() {
773 Ok(stat) => {
013fa7bb
DM
774 rrd_update_gauge("host/cpu", stat.cpu, save);
775 rrd_update_gauge("host/iowait", stat.iowait_percent, save);
4f951399
DM
776 }
777 Err(err) => {
778 eprintln!("read_proc_stat failed - {}", err);
eaeda365
DM
779 }
780 }
2c66a590 781
4f951399
DM
782 match read_meminfo() {
783 Ok(meminfo) => {
013fa7bb
DM
784 rrd_update_gauge("host/memtotal", meminfo.memtotal as f64, save);
785 rrd_update_gauge("host/memused", meminfo.memused as f64, save);
786 rrd_update_gauge("host/swaptotal", meminfo.swaptotal as f64, save);
787 rrd_update_gauge("host/swapused", meminfo.swapused as f64, save);
a4a3f7ca 788 }
4f951399
DM
789 Err(err) => {
790 eprintln!("read_meminfo failed - {}", err);
a4a3f7ca
DM
791 }
792 }
8f0cec26 793
4f951399
DM
794 match read_proc_net_dev() {
795 Ok(netdev) => {
6f422880 796 use pbs_config::network::is_physical_nic;
4f951399
DM
797 let mut netin = 0;
798 let mut netout = 0;
799 for item in netdev {
800 if !is_physical_nic(&item.device) { continue; }
801 netin += item.receive;
802 netout += item.send;
803 }
013fa7bb
DM
804 rrd_update_derive("host/netin", netin as f64, save);
805 rrd_update_derive("host/netout", netout as f64, save);
8f0cec26 806 }
4f951399
DM
807 Err(err) => {
808 eprintln!("read_prox_net_dev failed - {}", err);
8f0cec26
DM
809 }
810 }
dd15c0aa 811
485841da
DM
812 match read_loadavg() {
813 Ok(loadavg) => {
013fa7bb 814 rrd_update_gauge("host/loadavg", loadavg.0 as f64, save);
485841da
DM
815 }
816 Err(err) => {
817 eprintln!("read_loadavg failed - {}", err);
818 }
819 }
820
8c03041a
DM
821 let disk_manager = DiskManage::new();
822
013fa7bb 823 gather_disk_stats(disk_manager.clone(), Path::new("/"), "host", save);
91e5bb49 824
e7d4be9d 825 match pbs_config::datastore::config() {
d0833a70 826 Ok((config, _)) => {
e7d4be9d 827 let datastore_list: Vec<DataStoreConfig> =
17c7b46a 828 config.convert_to_typed_array("datastore").unwrap_or_default();
d0833a70
DM
829
830 for config in datastore_list {
8c03041a 831
91e5bb49 832 let rrd_prefix = format!("datastore/{}", config.name);
8c03041a 833 let path = std::path::Path::new(&config.path);
013fa7bb 834 gather_disk_stats(disk_manager.clone(), path, &rrd_prefix, save);
d0833a70
DM
835 }
836 }
837 Err(err) => {
838 eprintln!("read datastore config failed - {}", err);
839 }
840 }
841
4f951399 842 });
eaeda365 843}
dd15c0aa 844
b15751bf
DM
845fn check_schedule(worker_type: &str, event_str: &str, id: &str) -> bool {
846 let event = match parse_calendar_event(event_str) {
82c05b41
HL
847 Ok(event) => event,
848 Err(err) => {
849 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
850 return false;
851 }
852 };
853
b15751bf 854 let last = match jobstate::last_run_time(worker_type, &id) {
82c05b41
HL
855 Ok(time) => time,
856 Err(err) => {
857 eprintln!("could not get last run time of {} {}: {}", worker_type, id, err);
858 return false;
859 }
860 };
861
862 let next = match compute_next_event(&event, last, false) {
863 Ok(Some(next)) => next,
864 Ok(None) => return false,
865 Err(err) => {
866 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
867 return false;
868 }
869 };
870
871 let now = proxmox::tools::time::epoch_i64();
872 next <= now
873}
874
013fa7bb 875fn gather_disk_stats(disk_manager: Arc<DiskManage>, path: &Path, rrd_prefix: &str, save: bool) {
91e5bb49 876
934f5bb8 877 match proxmox_backup::tools::disks::disk_usage(path) {
33070956 878 Ok(status) => {
91e5bb49 879 let rrd_key = format!("{}/total", rrd_prefix);
33070956 880 rrd_update_gauge(&rrd_key, status.total as f64, save);
91e5bb49 881 let rrd_key = format!("{}/used", rrd_prefix);
33070956 882 rrd_update_gauge(&rrd_key, status.used as f64, save);
91e5bb49
DM
883 }
884 Err(err) => {
885 eprintln!("read disk_usage on {:?} failed - {}", path, err);
886 }
887 }
888
934f5bb8
DM
889 match disk_manager.find_mounted_device(path) {
890 Ok(None) => {},
891 Ok(Some((fs_type, device, source))) => {
892 let mut device_stat = None;
893 match fs_type.as_str() {
894 "zfs" => {
368f4c54
DC
895 if let Some(source) = source {
896 let pool = get_pool_from_dataset(&source).unwrap_or(&source);
897 match zfs_pool_stats(pool) {
934f5bb8
DM
898 Ok(stat) => device_stat = stat,
899 Err(err) => eprintln!("zfs_pool_stats({:?}) failed - {}", pool, err),
91e5bb49
DM
900 }
901 }
934f5bb8
DM
902 }
903 _ => {
904 if let Ok(disk) = disk_manager.clone().disk_by_dev_num(device.into_dev_t()) {
905 match disk.read_stat() {
906 Ok(stat) => device_stat = stat,
907 Err(err) => eprintln!("disk.read_stat {:?} failed - {}", path, err),
91e5bb49
DM
908 }
909 }
910 }
91e5bb49 911 }
934f5bb8
DM
912 if let Some(stat) = device_stat {
913 let rrd_key = format!("{}/read_ios", rrd_prefix);
914 rrd_update_derive(&rrd_key, stat.read_ios as f64, save);
915 let rrd_key = format!("{}/read_bytes", rrd_prefix);
916 rrd_update_derive(&rrd_key, (stat.read_sectors*512) as f64, save);
dd15c0aa 917
934f5bb8
DM
918 let rrd_key = format!("{}/write_ios", rrd_prefix);
919 rrd_update_derive(&rrd_key, stat.write_ios as f64, save);
920 let rrd_key = format!("{}/write_bytes", rrd_prefix);
921 rrd_update_derive(&rrd_key, (stat.write_sectors*512) as f64, save);
dd15c0aa 922
934f5bb8
DM
923 let rrd_key = format!("{}/io_ticks", rrd_prefix);
924 rrd_update_derive(&rrd_key, (stat.io_ticks as f64)/1000.0, save);
8c03041a
DM
925 }
926 }
934f5bb8
DM
927 Err(err) => {
928 eprintln!("find_mounted_device failed - {}", err);
929 }
8c03041a 930 }
8c03041a 931}