]> git.proxmox.com Git - proxmox-backup.git/blame - src/bin/proxmox-backup-proxy.rs
refactor send_command
[proxmox-backup.git] / src / bin / proxmox-backup-proxy.rs
CommitLineData
71f413cd 1use std::sync::Arc;
2ab5acac 2use std::path::{Path, PathBuf};
a723c087 3use std::pin::Pin;
97168f92 4use std::os::unix::io::AsRawFd;
a2479cfa 5
f7d4e4b5 6use anyhow::{bail, format_err, Error};
a2479cfa 7use futures::*;
ea368a06 8
a2479cfa 9use openssl::ssl::{SslMethod, SslAcceptor, SslFiletype};
7c667013 10use tokio_stream::wrappers::ReceiverStream;
a723c087 11use serde_json::Value;
a2479cfa 12
9ea4bce4 13use proxmox::try_block;
a2479cfa
WB
14use proxmox::api::RpcEnvironmentType;
15
1298618a
DM
16use proxmox_backup::{
17 backup::DataStore,
18 server::{
26858dba 19 auth::default_api_auth,
1298618a
DM
20 WorkerTask,
21 ApiConfig,
22 rest::*,
23 jobstate::{
24 self,
25 Job,
26 },
27 rotate_task_log_archive,
28 },
29 tools::systemd::time::{
30 parse_calendar_event,
31 compute_next_event,
32 },
33};
34
35
1cd951c9 36use proxmox_backup::api2::types::Authid;
a2ca7137 37use proxmox_backup::configdir;
4a7de56e 38use proxmox_backup::buildcfg;
e3f41f21 39use proxmox_backup::server;
d01e2420 40use proxmox_backup::auth_helpers::*;
97168f92 41use proxmox_backup::tools::{
e4f5f59e 42 daemon,
97168f92
DM
43 disks::{
44 DiskManage,
45 zfs_pool_stats,
368f4c54 46 get_pool_from_dataset,
97168f92 47 },
fe4cc5b1 48 logrotate::LogRotate,
97168f92
DM
49 socket::{
50 set_tcp_keepalive,
51 PROXMOX_BACKUP_TCP_KEEPALIVE_TIME,
52 },
53};
02c7a755 54
a13573c2 55use proxmox_backup::api2::pull::do_sync_job;
8513626b 56use proxmox_backup::api2::tape::backup::do_tape_backup_job;
1298618a 57use proxmox_backup::server::do_verification_job;
b8d90798 58use proxmox_backup::server::do_prune_job;
a13573c2 59
946c3e8a 60fn main() -> Result<(), Error> {
ac7513e3
DM
61 proxmox_backup::tools::setup_safe_path_env();
62
843880f0
TL
63 let backup_uid = proxmox_backup::backup::backup_user()?.uid;
64 let backup_gid = proxmox_backup::backup::backup_group()?.gid;
65 let running_uid = nix::unistd::Uid::effective();
66 let running_gid = nix::unistd::Gid::effective();
67
68 if running_uid != backup_uid || running_gid != backup_gid {
69 bail!("proxy not running as backup user or group (got uid {} gid {})", running_uid, running_gid);
70 }
71
946c3e8a 72 proxmox_backup::tools::runtime::main(run())
4223d9f8
DM
73}
74
fda5797b 75async fn run() -> Result<(), Error> {
02c7a755
DM
76 if let Err(err) = syslog::init(
77 syslog::Facility::LOG_DAEMON,
78 log::LevelFilter::Info,
79 Some("proxmox-backup-proxy")) {
4223d9f8 80 bail!("unable to inititialize syslog - {}", err);
02c7a755
DM
81 }
82
e1d367df
DM
83 // Note: To debug early connection error use
84 // PROXMOX_DEBUG=1 ./target/release/proxmox-backup-proxy
85 let debug = std::env::var("PROXMOX_DEBUG").is_ok();
86
d01e2420
DM
87 let _ = public_auth_key(); // load with lazy_static
88 let _ = csrf_secret(); // load with lazy_static
89
02c7a755 90 let mut config = ApiConfig::new(
26858dba
SR
91 buildcfg::JS_DIR,
92 &proxmox_backup::api2::ROUTER,
93 RpcEnvironmentType::PUBLIC,
94 default_api_auth(),
95 )?;
02c7a755 96
02c7a755
DM
97 config.add_alias("novnc", "/usr/share/novnc-pve");
98 config.add_alias("extjs", "/usr/share/javascript/extjs");
7f066a9b 99 config.add_alias("qrcodejs", "/usr/share/javascript/qrcodejs");
02c7a755
DM
100 config.add_alias("fontawesome", "/usr/share/fonts-font-awesome");
101 config.add_alias("xtermjs", "/usr/share/pve-xtermjs");
abd4c4cb 102 config.add_alias("locale", "/usr/share/pbs-i18n");
02c7a755 103 config.add_alias("widgettoolkit", "/usr/share/javascript/proxmox-widget-toolkit");
9c01e73c 104 config.add_alias("docs", "/usr/share/doc/proxmox-backup/html");
02c7a755 105
2ab5acac
DC
106 let mut indexpath = PathBuf::from(buildcfg::JS_DIR);
107 indexpath.push("index.hbs");
108 config.register_template("index", &indexpath)?;
01ca99da 109 config.register_template("console", "/usr/share/pve-xtermjs/index.html.hbs")?;
2ab5acac 110
a68768cf
TL
111 let mut commando_sock = server::CommandoSocket::new(server::our_ctrl_sock());
112
fe4cc5b1 113 config.enable_file_log(buildcfg::API_ACCESS_LOG_FN, &mut commando_sock)?;
8e7e2223 114
02c7a755
DM
115 let rest_server = RestServer::new(config);
116
6d1f61b2 117 //openssl req -x509 -newkey rsa:4096 -keyout /etc/proxmox-backup/proxy.key -out /etc/proxmox-backup/proxy.pem -nodes
6d1f61b2 118
c381a162
WB
119 // we build the initial acceptor here as we cannot start if this fails - certificate reloads
120 // will be handled inside the accept loop and simply log an error if we cannot load the new
121 // certificate!
122 let acceptor = make_tls_acceptor()?;
6d1f61b2 123
a723c087
WB
124 // to renew the acceptor we just let a command-socket handler trigger a Notify:
125 let notify_tls_cert_reload = Arc::new(tokio::sync::Notify::new());
126 commando_sock.register_command(
127 "reload-certificate".to_string(),
128 {
129 let notify_tls_cert_reload = Arc::clone(&notify_tls_cert_reload);
130 move |_value| -> Result<_, Error> {
131 notify_tls_cert_reload.notify_one();
132 Ok(Value::Null)
133 }
134 },
135 )?;
0d176f36 136
a690ecac
WB
137 let server = daemon::create_daemon(
138 ([0,0,0,0,0,0,0,0], 8007).into(),
a723c087 139 move |listener, ready| {
97168f92 140
a723c087 141 let connections = accept_connections(listener, acceptor, debug, notify_tls_cert_reload);
7c667013 142 let connections = hyper::server::accept::from_stream(ReceiverStream::new(connections));
083ff3fd
WB
143
144 Ok(ready
48aa2b93 145 .and_then(|_| hyper::Server::builder(connections)
083ff3fd
WB
146 .serve(rest_server)
147 .with_graceful_shutdown(server::shutdown_future())
148 .map_err(Error::from)
149 )
150 .map_err(|err| eprintln!("server error: {}", err))
151 .map(|_| ())
a690ecac 152 )
a2ca7137 153 },
d7c6ad60 154 "proxmox-backup-proxy.service",
083ff3fd 155 );
a2ca7137 156
04b053d8 157 server::write_pid(buildcfg::PROXMOX_BACKUP_PROXY_PID_FN)?;
d98c9a7a
WB
158 daemon::systemd_notify(daemon::SystemdNotify::Ready)?;
159
fda5797b 160 let init_result: Result<(), Error> = try_block!({
a68768cf
TL
161 server::register_task_control_commands(&mut commando_sock)?;
162 commando_sock.spawn()?;
fda5797b
WB
163 server::server_state_init()?;
164 Ok(())
165 });
d607b886 166
fda5797b
WB
167 if let Err(err) = init_result {
168 bail!("unable to start daemon - {}", err);
169 }
e3f41f21 170
8545480a 171 start_task_scheduler();
eaeda365 172 start_stat_generator();
8545480a 173
083ff3fd 174 server.await?;
a546a8a0
WB
175 log::info!("server shutting down, waiting for active workers to complete");
176 proxmox_backup::server::last_worker_future().await?;
fda5797b 177 log::info!("done - exit server");
e3f41f21 178
4223d9f8 179 Ok(())
02c7a755 180}
8545480a 181
c381a162
WB
182fn make_tls_acceptor() -> Result<Arc<SslAcceptor>, Error> {
183 let key_path = configdir!("/proxy.key");
184 let cert_path = configdir!("/proxy.pem");
185
186 let mut acceptor = SslAcceptor::mozilla_intermediate_v5(SslMethod::tls()).unwrap();
187 acceptor.set_private_key_file(key_path, SslFiletype::PEM)
188 .map_err(|err| format_err!("unable to read proxy key {} - {}", key_path, err))?;
189 acceptor.set_certificate_chain_file(cert_path)
190 .map_err(|err| format_err!("unable to read proxy cert {} - {}", cert_path, err))?;
191 acceptor.check_private_key().unwrap();
192
193 Ok(Arc::new(acceptor.build()))
194}
195
a5e3be49
WB
196type ClientStreamResult =
197 Result<std::pin::Pin<Box<tokio_openssl::SslStream<tokio::net::TcpStream>>>, Error>;
198const MAX_PENDING_ACCEPTS: usize = 1024;
199
48aa2b93 200fn accept_connections(
0bfcea6a 201 listener: tokio::net::TcpListener,
48aa2b93 202 acceptor: Arc<openssl::ssl::SslAcceptor>,
e1d367df 203 debug: bool,
a723c087 204 notify_tls_cert_reload: Arc<tokio::sync::Notify>,
a5e3be49 205) -> tokio::sync::mpsc::Receiver<ClientStreamResult> {
48aa2b93 206
ea93bea7 207 let (sender, receiver) = tokio::sync::mpsc::channel(MAX_PENDING_ACCEPTS);
48aa2b93 208
a723c087 209 tokio::spawn(accept_connection(listener, acceptor, debug, sender, notify_tls_cert_reload));
a5e3be49
WB
210
211 receiver
212}
213
214async fn accept_connection(
215 listener: tokio::net::TcpListener,
a723c087 216 mut acceptor: Arc<openssl::ssl::SslAcceptor>,
a5e3be49
WB
217 debug: bool,
218 sender: tokio::sync::mpsc::Sender<ClientStreamResult>,
a723c087 219 notify_tls_cert_reload: Arc<tokio::sync::Notify>,
a5e3be49 220) {
ea93bea7 221 let accept_counter = Arc::new(());
48aa2b93 222
a723c087
WB
223 // Note that these must not be moved out/modified directly, they get pinned in the loop and
224 // "rearmed" after waking up:
225 let mut reload_tls = notify_tls_cert_reload.notified();
226 let mut accept = listener.accept();
227
a5e3be49 228 loop {
a723c087
WB
229 let sock;
230
231 // normally we'd use `tokio::pin!()` but we need this to happen outside the loop and we
232 // need to be able to "rearm" the futures:
233 let reload_tls_pin = unsafe { Pin::new_unchecked(&mut reload_tls) };
234 let accept_pin = unsafe { Pin::new_unchecked(&mut accept) };
235 tokio::select! {
236 _ = reload_tls_pin => {
237 // rearm the notification:
238 reload_tls = notify_tls_cert_reload.notified();
239
240 log::info!("reloading certificate");
241 match make_tls_acceptor() {
242 Err(err) => eprintln!("error reloading certificate: {}", err),
243 Ok(new_acceptor) => acceptor = new_acceptor,
244 }
cc269b9f 245 continue;
a5e3be49 246 }
a723c087
WB
247 res = accept_pin => match res {
248 Err(err) => {
249 eprintln!("error accepting tcp connection: {}", err);
250 continue;
251 }
252 Ok((new_sock, _addr)) => {
253 // rearm the accept future:
254 accept = listener.accept();
255
256 sock = new_sock;
257 }
258 }
cc269b9f 259 };
48aa2b93 260
cc269b9f
WB
261 sock.set_nodelay(true).unwrap();
262 let _ = set_tcp_keepalive(sock.as_raw_fd(), PROXMOX_BACKUP_TCP_KEEPALIVE_TIME);
263 let acceptor = Arc::clone(&acceptor);
48aa2b93 264
cc269b9f
WB
265 let ssl = match openssl::ssl::Ssl::new(acceptor.context()) {
266 Ok(ssl) => ssl,
267 Err(err) => {
268 eprintln!("failed to create Ssl object from Acceptor context - {}", err);
269 continue;
270 },
271 };
272 let stream = match tokio_openssl::SslStream::new(ssl, sock) {
273 Ok(stream) => stream,
274 Err(err) => {
275 eprintln!("failed to create SslStream using ssl and connection socket - {}", err);
276 continue;
277 },
278 };
279
280 let mut stream = Box::pin(stream);
281 let sender = sender.clone();
282
283 if Arc::strong_count(&accept_counter) > MAX_PENDING_ACCEPTS {
284 eprintln!("connection rejected - to many open connections");
285 continue;
48aa2b93 286 }
cc269b9f 287
b4931192 288 let accept_counter = Arc::clone(&accept_counter);
cc269b9f
WB
289 tokio::spawn(async move {
290 let accept_future = tokio::time::timeout(
291 Duration::new(10, 0), stream.as_mut().accept());
292
293 let result = accept_future.await;
294
295 match result {
296 Ok(Ok(())) => {
297 if sender.send(Ok(stream)).await.is_err() && debug {
298 eprintln!("detect closed connection channel");
299 }
300 }
301 Ok(Err(err)) => {
302 if debug {
303 eprintln!("https handshake failed - {}", err);
304 }
305 }
306 Err(_) => {
307 if debug {
308 eprintln!("https handshake timeout");
309 }
310 }
311 }
312
313 drop(accept_counter); // decrease reference count
314 });
a5e3be49 315 }
48aa2b93
DM
316}
317
eaeda365
DM
318fn start_stat_generator() {
319 let abort_future = server::shutdown_future();
320 let future = Box::pin(run_stat_generator());
321 let task = futures::future::select(future, abort_future);
322 tokio::spawn(task.map(|_| ()));
323}
324
8545480a
DM
325fn start_task_scheduler() {
326 let abort_future = server::shutdown_future();
327 let future = Box::pin(run_task_scheduler());
328 let task = futures::future::select(future, abort_future);
329 tokio::spawn(task.map(|_| ()));
330}
331
6a7be83e 332use std::time::{SystemTime, Instant, Duration, UNIX_EPOCH};
8545480a
DM
333
334fn next_minute() -> Result<Instant, Error> {
6a7be83e
DM
335 let now = SystemTime::now();
336 let epoch_now = now.duration_since(UNIX_EPOCH)?;
337 let epoch_next = Duration::from_secs((epoch_now.as_secs()/60 + 1)*60);
8545480a
DM
338 Ok(Instant::now() + epoch_next - epoch_now)
339}
340
341async fn run_task_scheduler() {
342
343 let mut count: usize = 0;
344
345 loop {
346 count += 1;
347
348 let delay_target = match next_minute() { // try to run very minute
349 Ok(d) => d,
350 Err(err) => {
351 eprintln!("task scheduler: compute next minute failed - {}", err);
0a8d773a 352 tokio::time::sleep_until(tokio::time::Instant::from_std(Instant::now() + Duration::from_secs(60))).await;
8545480a
DM
353 continue;
354 }
355 };
356
357 if count > 2 { // wait 1..2 minutes before starting
358 match schedule_tasks().catch_unwind().await {
359 Err(panic) => {
360 match panic.downcast::<&str>() {
361 Ok(msg) => {
362 eprintln!("task scheduler panic: {}", msg);
363 }
364 Err(_) => {
365 eprintln!("task scheduler panic - unknown type");
366 }
367 }
368 }
369 Ok(Err(err)) => {
370 eprintln!("task scheduler failed - {:?}", err);
371 }
372 Ok(Ok(_)) => {}
373 }
374 }
375
0a8d773a 376 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
8545480a
DM
377 }
378}
379
380async fn schedule_tasks() -> Result<(), Error> {
381
382 schedule_datastore_garbage_collection().await;
25829a87 383 schedule_datastore_prune().await;
a6160cdf 384 schedule_datastore_sync_jobs().await;
73df9c51 385 schedule_datastore_verify_jobs().await;
8513626b 386 schedule_tape_backup_jobs().await;
9a760917 387 schedule_task_log_rotate().await;
8545480a
DM
388
389 Ok(())
390}
391
8545480a
DM
392async fn schedule_datastore_garbage_collection() {
393
b9e7bcc2
DM
394 use proxmox_backup::config::{
395 datastore::{
396 self,
397 DataStoreConfig,
398 },
d7a122a0 399 };
8545480a 400
25829a87 401 let config = match datastore::config() {
8545480a
DM
402 Err(err) => {
403 eprintln!("unable to read datastore config - {}", err);
404 return;
405 }
406 Ok((config, _digest)) => config,
407 };
408
409 for (store, (_, store_config)) in config.sections {
410 let datastore = match DataStore::lookup_datastore(&store) {
411 Ok(datastore) => datastore,
412 Err(err) => {
413 eprintln!("lookup_datastore failed - {}", err);
414 continue;
415 }
416 };
417
25829a87 418 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
8545480a
DM
419 Ok(c) => c,
420 Err(err) => {
421 eprintln!("datastore config from_value failed - {}", err);
422 continue;
423 }
424 };
425
426 let event_str = match store_config.gc_schedule {
427 Some(event_str) => event_str,
428 None => continue,
429 };
430
431 let event = match parse_calendar_event(&event_str) {
432 Ok(event) => event,
433 Err(err) => {
434 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
435 continue;
436 }
437 };
438
439 if datastore.garbage_collection_running() { continue; }
440
441 let worker_type = "garbage_collection";
442
b6ba5acd
DC
443 let last = match jobstate::last_run_time(worker_type, &store) {
444 Ok(time) => time,
445 Err(err) => {
446 eprintln!("could not get last run time of {} {}: {}", worker_type, store, err);
447 continue;
8545480a
DM
448 }
449 };
450
451 let next = match compute_next_event(&event, last, false) {
15ec790a
DC
452 Ok(Some(next)) => next,
453 Ok(None) => continue,
8545480a
DM
454 Err(err) => {
455 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
456 continue;
457 }
458 };
e693818a 459
6a7be83e
DM
460 let now = proxmox::tools::time::epoch_i64();
461
8545480a
DM
462 if next > now { continue; }
463
1cd951c9 464 let job = match Job::new(worker_type, &store) {
d7a122a0
DC
465 Ok(job) => job,
466 Err(_) => continue, // could not get lock
467 };
468
ad54df31 469 let auth_id = Authid::root_auth_id();
d7a122a0 470
c724f658 471 if let Err(err) = crate::server::do_garbage_collection_job(job, datastore, auth_id, Some(event_str), false) {
3b707fbb 472 eprintln!("unable to start garbage collection job on datastore {} - {}", store, err);
8545480a
DM
473 }
474 }
475}
25829a87
DM
476
477async fn schedule_datastore_prune() {
478
1298618a
DM
479 use proxmox_backup::{
480 backup::{
481 PruneOptions,
1298618a
DM
482 },
483 config::datastore::{
484 self,
485 DataStoreConfig,
486 },
9866de5e 487 };
25829a87
DM
488
489 let config = match datastore::config() {
490 Err(err) => {
491 eprintln!("unable to read datastore config - {}", err);
492 return;
493 }
494 Ok((config, _digest)) => config,
495 };
496
497 for (store, (_, store_config)) in config.sections {
25829a87
DM
498
499 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
500 Ok(c) => c,
501 Err(err) => {
a6160cdf 502 eprintln!("datastore '{}' config from_value failed - {}", store, err);
25829a87
DM
503 continue;
504 }
505 };
506
507 let event_str = match store_config.prune_schedule {
508 Some(event_str) => event_str,
509 None => continue,
510 };
511
512 let prune_options = PruneOptions {
513 keep_last: store_config.keep_last,
514 keep_hourly: store_config.keep_hourly,
515 keep_daily: store_config.keep_daily,
516 keep_weekly: store_config.keep_weekly,
517 keep_monthly: store_config.keep_monthly,
518 keep_yearly: store_config.keep_yearly,
519 };
520
521 if !prune_options.keeps_something() { // no prune settings - keep all
522 continue;
523 }
524
25829a87 525 let worker_type = "prune";
b15751bf 526 if check_schedule(worker_type, &event_str, &store) {
82c05b41
HL
527 let job = match Job::new(worker_type, &store) {
528 Ok(job) => job,
529 Err(_) => continue, // could not get lock
530 };
25829a87 531
ad54df31 532 let auth_id = Authid::root_auth_id().clone();
82c05b41
HL
533 if let Err(err) = do_prune_job(job, prune_options, store.clone(), &auth_id, Some(event_str)) {
534 eprintln!("unable to start datastore prune job {} - {}", &store, err);
25829a87
DM
535 }
536 };
25829a87
DM
537 }
538}
a6160cdf
DM
539
540async fn schedule_datastore_sync_jobs() {
541
1298618a
DM
542 use proxmox_backup::config::sync::{
543 self,
544 SyncJobConfig,
a6160cdf
DM
545 };
546
547 let config = match sync::config() {
548 Err(err) => {
549 eprintln!("unable to read sync job config - {}", err);
550 return;
551 }
552 Ok((config, _digest)) => config,
553 };
554
a6160cdf
DM
555 for (job_id, (_, job_config)) in config.sections {
556 let job_config: SyncJobConfig = match serde_json::from_value(job_config) {
557 Ok(c) => c,
558 Err(err) => {
559 eprintln!("sync job config from_value failed - {}", err);
560 continue;
561 }
562 };
563
564 let event_str = match job_config.schedule {
565 Some(ref event_str) => event_str.clone(),
566 None => continue,
567 };
568
c67b1fa7 569 let worker_type = "syncjob";
b15751bf 570 if check_schedule(worker_type, &event_str, &job_id) {
82c05b41
HL
571 let job = match Job::new(worker_type, &job_id) {
572 Ok(job) => job,
573 Err(_) => continue, // could not get lock
574 };
a6160cdf 575
ad54df31 576 let auth_id = Authid::root_auth_id().clone();
82c05b41
HL
577 if let Err(err) = do_sync_job(job, job_config, &auth_id, Some(event_str)) {
578 eprintln!("unable to start datastore sync job {} - {}", &job_id, err);
a6160cdf
DM
579 }
580 };
a6160cdf
DM
581 }
582}
eaeda365 583
73df9c51 584async fn schedule_datastore_verify_jobs() {
1298618a
DM
585
586 use proxmox_backup::config::verify::{
587 self,
588 VerificationJobConfig,
73df9c51 589 };
1298618a 590
73df9c51
HL
591 let config = match verify::config() {
592 Err(err) => {
593 eprintln!("unable to read verification job config - {}", err);
594 return;
595 }
596 Ok((config, _digest)) => config,
597 };
598 for (job_id, (_, job_config)) in config.sections {
599 let job_config: VerificationJobConfig = match serde_json::from_value(job_config) {
600 Ok(c) => c,
601 Err(err) => {
602 eprintln!("verification job config from_value failed - {}", err);
603 continue;
604 }
605 };
606 let event_str = match job_config.schedule {
607 Some(ref event_str) => event_str.clone(),
608 None => continue,
609 };
82c05b41 610
73df9c51 611 let worker_type = "verificationjob";
ad54df31 612 let auth_id = Authid::root_auth_id().clone();
b15751bf 613 if check_schedule(worker_type, &event_str, &job_id) {
82c05b41
HL
614 let job = match Job::new(&worker_type, &job_id) {
615 Ok(job) => job,
616 Err(_) => continue, // could not get lock
617 };
618 if let Err(err) = do_verification_job(job, job_config, &auth_id, Some(event_str)) {
619 eprintln!("unable to start datastore verification job {} - {}", &job_id, err);
73df9c51
HL
620 }
621 };
73df9c51
HL
622 }
623}
624
8513626b
DM
625async fn schedule_tape_backup_jobs() {
626
627 use proxmox_backup::config::tape_job::{
628 self,
629 TapeBackupJobConfig,
630 };
631
632 let config = match tape_job::config() {
633 Err(err) => {
634 eprintln!("unable to read tape job config - {}", err);
635 return;
636 }
637 Ok((config, _digest)) => config,
638 };
639 for (job_id, (_, job_config)) in config.sections {
640 let job_config: TapeBackupJobConfig = match serde_json::from_value(job_config) {
641 Ok(c) => c,
642 Err(err) => {
643 eprintln!("tape backup job config from_value failed - {}", err);
644 continue;
645 }
646 };
647 let event_str = match job_config.schedule {
648 Some(ref event_str) => event_str.clone(),
649 None => continue,
650 };
651
652 let worker_type = "tape-backup-job";
653 let auth_id = Authid::root_auth_id().clone();
654 if check_schedule(worker_type, &event_str, &job_id) {
655 let job = match Job::new(&worker_type, &job_id) {
656 Ok(job) => job,
657 Err(_) => continue, // could not get lock
658 };
5830e562 659 if let Err(err) = do_tape_backup_job(job, job_config.setup, &auth_id, Some(event_str)) {
7a61f89e 660 eprintln!("unable to start tape backup job {} - {}", &job_id, err);
8513626b
DM
661 }
662 };
663 }
664}
665
666
9a760917 667async fn schedule_task_log_rotate() {
9a760917
DC
668
669 let worker_type = "logrotate";
72aa1834 670 let job_id = "access-log_and_task-archive";
9a760917 671
9a760917
DC
672 // schedule daily at 00:00 like normal logrotate
673 let schedule = "00:00";
674
b15751bf 675 if !check_schedule(worker_type, schedule, job_id) {
9a760917
DC
676 // if we never ran the rotation, schedule instantly
677 match jobstate::JobState::load(worker_type, job_id) {
678 Ok(state) => match state {
679 jobstate::JobState::Created { .. } => {},
680 _ => return,
681 },
682 _ => return,
683 }
684 }
685
686 let mut job = match Job::new(worker_type, job_id) {
687 Ok(job) => job,
688 Err(_) => return, // could not get lock
689 };
690
691 if let Err(err) = WorkerTask::new_thread(
692 worker_type,
72aa1834 693 None,
ad54df31 694 Authid::root_auth_id().clone(),
9a760917
DC
695 false,
696 move |worker| {
697 job.start(&worker.upid().to_string())?;
3b82f3ee 698 worker.log("starting task log rotation".to_string());
e4f5f59e 699
9a760917 700 let result = try_block!({
b7f2be51
TL
701 let max_size = 512 * 1024 - 1; // an entry has ~ 100b, so > 5000 entries/file
702 let max_files = 20; // times twenty files gives > 100000 task entries
9a760917
DC
703 let has_rotated = rotate_task_log_archive(max_size, true, Some(max_files))?;
704 if has_rotated {
3b82f3ee 705 worker.log("task log archive was rotated".to_string());
9a760917 706 } else {
3b82f3ee 707 worker.log("task log archive was not rotated".to_string());
9a760917
DC
708 }
709
fe4cc5b1
TL
710 let max_size = 32 * 1024 * 1024 - 1;
711 let max_files = 14;
712 let mut logrotate = LogRotate::new(buildcfg::API_ACCESS_LOG_FN, true)
713 .ok_or_else(|| format_err!("could not get API access log file names"))?;
714
fe7bdc9d 715 if logrotate.rotate(max_size, None, Some(max_files))? {
fe4cc5b1
TL
716 println!("rotated access log, telling daemons to re-open log file");
717 proxmox_backup::tools::runtime::block_on(command_reopen_logfiles())?;
3b82f3ee 718 worker.log("API access log was rotated".to_string());
fe7bdc9d 719 } else {
3b82f3ee 720 worker.log("API access log was not rotated".to_string());
fe7bdc9d
TL
721 }
722
723 let mut logrotate = LogRotate::new(buildcfg::API_AUTH_LOG_FN, true)
724 .ok_or_else(|| format_err!("could not get API auth log file names"))?;
fe4cc5b1 725
fe7bdc9d 726 if logrotate.rotate(max_size, None, Some(max_files))? {
3b82f3ee 727 worker.log("API authentication log was rotated".to_string());
fe4cc5b1 728 } else {
3b82f3ee 729 worker.log("API authentication log was not rotated".to_string());
fe4cc5b1
TL
730 }
731
9a760917
DC
732 Ok(())
733 });
734
735 let status = worker.create_state(&result);
736
737 if let Err(err) = job.finish(status) {
738 eprintln!("could not finish job state for {}: {}", worker_type, err);
739 }
740
741 result
742 },
743 ) {
744 eprintln!("unable to start task log rotation: {}", err);
745 }
746
747}
748
fe4cc5b1
TL
749async fn command_reopen_logfiles() -> Result<(), Error> {
750 // only care about the most recent daemon instance for each, proxy & api, as other older ones
751 // should not respond to new requests anyway, but only finish their current one and then exit.
752 let sock = server::our_ctrl_sock();
45b8a032 753 let f1 = server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
fe4cc5b1
TL
754
755 let pid = server::read_pid(buildcfg::PROXMOX_BACKUP_API_PID_FN)?;
756 let sock = server::ctrl_sock_from_pid(pid);
45b8a032 757 let f2 = server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
546b6a23
TL
758
759 match futures::join!(f1, f2) {
760 (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)),
761 (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)),
762 (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)),
763 _ => Ok(()),
764 }
fe4cc5b1
TL
765}
766
eaeda365
DM
767async fn run_stat_generator() {
768
013fa7bb 769 let mut count = 0;
eaeda365 770 loop {
013fa7bb 771 count += 1;
a720894f 772 let save = if count >= 6 { count = 0; true } else { false };
013fa7bb 773
eaeda365
DM
774 let delay_target = Instant::now() + Duration::from_secs(10);
775
013fa7bb 776 generate_host_stats(save).await;
eaeda365 777
0a8d773a 778 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
013fa7bb
DM
779
780 }
eaeda365
DM
781
782}
783
013fa7bb 784fn rrd_update_gauge(name: &str, value: f64, save: bool) {
309ef20d 785 use proxmox_backup::rrd;
013fa7bb 786 if let Err(err) = rrd::update_value(name, value, rrd::DST::Gauge, save) {
309ef20d
DM
787 eprintln!("rrd::update_value '{}' failed - {}", name, err);
788 }
789}
790
013fa7bb 791fn rrd_update_derive(name: &str, value: f64, save: bool) {
309ef20d 792 use proxmox_backup::rrd;
013fa7bb 793 if let Err(err) = rrd::update_value(name, value, rrd::DST::Derive, save) {
309ef20d
DM
794 eprintln!("rrd::update_value '{}' failed - {}", name, err);
795 }
796}
797
013fa7bb 798async fn generate_host_stats(save: bool) {
8f0cec26 799 use proxmox::sys::linux::procfs::{
485841da 800 read_meminfo, read_proc_stat, read_proc_net_dev, read_loadavg};
309ef20d 801 use proxmox_backup::config::datastore;
8c03041a 802
eaeda365 803
4f951399
DM
804 proxmox_backup::tools::runtime::block_in_place(move || {
805
806 match read_proc_stat() {
807 Ok(stat) => {
013fa7bb
DM
808 rrd_update_gauge("host/cpu", stat.cpu, save);
809 rrd_update_gauge("host/iowait", stat.iowait_percent, save);
4f951399
DM
810 }
811 Err(err) => {
812 eprintln!("read_proc_stat failed - {}", err);
eaeda365
DM
813 }
814 }
2c66a590 815
4f951399
DM
816 match read_meminfo() {
817 Ok(meminfo) => {
013fa7bb
DM
818 rrd_update_gauge("host/memtotal", meminfo.memtotal as f64, save);
819 rrd_update_gauge("host/memused", meminfo.memused as f64, save);
820 rrd_update_gauge("host/swaptotal", meminfo.swaptotal as f64, save);
821 rrd_update_gauge("host/swapused", meminfo.swapused as f64, save);
a4a3f7ca 822 }
4f951399
DM
823 Err(err) => {
824 eprintln!("read_meminfo failed - {}", err);
a4a3f7ca
DM
825 }
826 }
8f0cec26 827
4f951399
DM
828 match read_proc_net_dev() {
829 Ok(netdev) => {
830 use proxmox_backup::config::network::is_physical_nic;
831 let mut netin = 0;
832 let mut netout = 0;
833 for item in netdev {
834 if !is_physical_nic(&item.device) { continue; }
835 netin += item.receive;
836 netout += item.send;
837 }
013fa7bb
DM
838 rrd_update_derive("host/netin", netin as f64, save);
839 rrd_update_derive("host/netout", netout as f64, save);
8f0cec26 840 }
4f951399
DM
841 Err(err) => {
842 eprintln!("read_prox_net_dev failed - {}", err);
8f0cec26
DM
843 }
844 }
dd15c0aa 845
485841da
DM
846 match read_loadavg() {
847 Ok(loadavg) => {
013fa7bb 848 rrd_update_gauge("host/loadavg", loadavg.0 as f64, save);
485841da
DM
849 }
850 Err(err) => {
851 eprintln!("read_loadavg failed - {}", err);
852 }
853 }
854
8c03041a
DM
855 let disk_manager = DiskManage::new();
856
013fa7bb 857 gather_disk_stats(disk_manager.clone(), Path::new("/"), "host", save);
91e5bb49 858
d0833a70
DM
859 match datastore::config() {
860 Ok((config, _)) => {
861 let datastore_list: Vec<datastore::DataStoreConfig> =
17c7b46a 862 config.convert_to_typed_array("datastore").unwrap_or_default();
d0833a70
DM
863
864 for config in datastore_list {
8c03041a 865
91e5bb49 866 let rrd_prefix = format!("datastore/{}", config.name);
8c03041a 867 let path = std::path::Path::new(&config.path);
013fa7bb 868 gather_disk_stats(disk_manager.clone(), path, &rrd_prefix, save);
d0833a70
DM
869 }
870 }
871 Err(err) => {
872 eprintln!("read datastore config failed - {}", err);
873 }
874 }
875
4f951399 876 });
eaeda365 877}
dd15c0aa 878
b15751bf
DM
879fn check_schedule(worker_type: &str, event_str: &str, id: &str) -> bool {
880 let event = match parse_calendar_event(event_str) {
82c05b41
HL
881 Ok(event) => event,
882 Err(err) => {
883 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
884 return false;
885 }
886 };
887
b15751bf 888 let last = match jobstate::last_run_time(worker_type, &id) {
82c05b41
HL
889 Ok(time) => time,
890 Err(err) => {
891 eprintln!("could not get last run time of {} {}: {}", worker_type, id, err);
892 return false;
893 }
894 };
895
896 let next = match compute_next_event(&event, last, false) {
897 Ok(Some(next)) => next,
898 Ok(None) => return false,
899 Err(err) => {
900 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
901 return false;
902 }
903 };
904
905 let now = proxmox::tools::time::epoch_i64();
906 next <= now
907}
908
013fa7bb 909fn gather_disk_stats(disk_manager: Arc<DiskManage>, path: &Path, rrd_prefix: &str, save: bool) {
91e5bb49 910
934f5bb8 911 match proxmox_backup::tools::disks::disk_usage(path) {
33070956 912 Ok(status) => {
91e5bb49 913 let rrd_key = format!("{}/total", rrd_prefix);
33070956 914 rrd_update_gauge(&rrd_key, status.total as f64, save);
91e5bb49 915 let rrd_key = format!("{}/used", rrd_prefix);
33070956 916 rrd_update_gauge(&rrd_key, status.used as f64, save);
91e5bb49
DM
917 }
918 Err(err) => {
919 eprintln!("read disk_usage on {:?} failed - {}", path, err);
920 }
921 }
922
934f5bb8
DM
923 match disk_manager.find_mounted_device(path) {
924 Ok(None) => {},
925 Ok(Some((fs_type, device, source))) => {
926 let mut device_stat = None;
927 match fs_type.as_str() {
928 "zfs" => {
368f4c54
DC
929 if let Some(source) = source {
930 let pool = get_pool_from_dataset(&source).unwrap_or(&source);
931 match zfs_pool_stats(pool) {
934f5bb8
DM
932 Ok(stat) => device_stat = stat,
933 Err(err) => eprintln!("zfs_pool_stats({:?}) failed - {}", pool, err),
91e5bb49
DM
934 }
935 }
934f5bb8
DM
936 }
937 _ => {
938 if let Ok(disk) = disk_manager.clone().disk_by_dev_num(device.into_dev_t()) {
939 match disk.read_stat() {
940 Ok(stat) => device_stat = stat,
941 Err(err) => eprintln!("disk.read_stat {:?} failed - {}", path, err),
91e5bb49
DM
942 }
943 }
944 }
91e5bb49 945 }
934f5bb8
DM
946 if let Some(stat) = device_stat {
947 let rrd_key = format!("{}/read_ios", rrd_prefix);
948 rrd_update_derive(&rrd_key, stat.read_ios as f64, save);
949 let rrd_key = format!("{}/read_bytes", rrd_prefix);
950 rrd_update_derive(&rrd_key, (stat.read_sectors*512) as f64, save);
dd15c0aa 951
934f5bb8
DM
952 let rrd_key = format!("{}/write_ios", rrd_prefix);
953 rrd_update_derive(&rrd_key, stat.write_ios as f64, save);
954 let rrd_key = format!("{}/write_bytes", rrd_prefix);
955 rrd_update_derive(&rrd_key, (stat.write_sectors*512) as f64, save);
dd15c0aa 956
934f5bb8
DM
957 let rrd_key = format!("{}/io_ticks", rrd_prefix);
958 rrd_update_derive(&rrd_key, (stat.io_ticks as f64)/1000.0, save);
8c03041a
DM
959 }
960 }
934f5bb8
DM
961 Err(err) => {
962 eprintln!("find_mounted_device failed - {}", err);
963 }
8c03041a 964 }
8c03041a 965}