]>
Commit | Line | Data |
---|---|---|
71f413cd | 1 | use std::sync::Arc; |
2ab5acac | 2 | use std::path::{Path, PathBuf}; |
97168f92 | 3 | use std::os::unix::io::AsRawFd; |
a2479cfa | 4 | |
f7d4e4b5 | 5 | use anyhow::{bail, format_err, Error}; |
a2479cfa WB |
6 | use futures::*; |
7 | use hyper; | |
8 | use openssl::ssl::{SslMethod, SslAcceptor, SslFiletype}; | |
9 | ||
9ea4bce4 | 10 | use proxmox::try_block; |
a2479cfa WB |
11 | use proxmox::api::RpcEnvironmentType; |
12 | ||
1298618a DM |
13 | use proxmox_backup::{ |
14 | backup::DataStore, | |
15 | server::{ | |
1298618a DM |
16 | WorkerTask, |
17 | ApiConfig, | |
18 | rest::*, | |
19 | jobstate::{ | |
20 | self, | |
21 | Job, | |
22 | }, | |
23 | rotate_task_log_archive, | |
24 | }, | |
25 | tools::systemd::time::{ | |
26 | parse_calendar_event, | |
27 | compute_next_event, | |
28 | }, | |
29 | }; | |
30 | ||
31 | ||
1cd951c9 | 32 | use proxmox_backup::api2::types::Authid; |
a2ca7137 | 33 | use proxmox_backup::configdir; |
4a7de56e | 34 | use proxmox_backup::buildcfg; |
e3f41f21 | 35 | use proxmox_backup::server; |
d01e2420 | 36 | use proxmox_backup::auth_helpers::*; |
97168f92 | 37 | use proxmox_backup::tools::{ |
e4f5f59e | 38 | daemon, |
97168f92 DM |
39 | disks::{ |
40 | DiskManage, | |
41 | zfs_pool_stats, | |
42 | }, | |
fe4cc5b1 | 43 | logrotate::LogRotate, |
97168f92 DM |
44 | socket::{ |
45 | set_tcp_keepalive, | |
46 | PROXMOX_BACKUP_TCP_KEEPALIVE_TIME, | |
47 | }, | |
48 | }; | |
02c7a755 | 49 | |
a13573c2 | 50 | use proxmox_backup::api2::pull::do_sync_job; |
1298618a | 51 | use proxmox_backup::server::do_verification_job; |
b8d90798 | 52 | use proxmox_backup::server::do_prune_job; |
a13573c2 | 53 | |
946c3e8a | 54 | fn main() -> Result<(), Error> { |
ac7513e3 DM |
55 | proxmox_backup::tools::setup_safe_path_env(); |
56 | ||
843880f0 TL |
57 | let backup_uid = proxmox_backup::backup::backup_user()?.uid; |
58 | let backup_gid = proxmox_backup::backup::backup_group()?.gid; | |
59 | let running_uid = nix::unistd::Uid::effective(); | |
60 | let running_gid = nix::unistd::Gid::effective(); | |
61 | ||
62 | if running_uid != backup_uid || running_gid != backup_gid { | |
63 | bail!("proxy not running as backup user or group (got uid {} gid {})", running_uid, running_gid); | |
64 | } | |
65 | ||
946c3e8a | 66 | proxmox_backup::tools::runtime::main(run()) |
4223d9f8 DM |
67 | } |
68 | ||
fda5797b | 69 | async fn run() -> Result<(), Error> { |
02c7a755 DM |
70 | if let Err(err) = syslog::init( |
71 | syslog::Facility::LOG_DAEMON, | |
72 | log::LevelFilter::Info, | |
73 | Some("proxmox-backup-proxy")) { | |
4223d9f8 | 74 | bail!("unable to inititialize syslog - {}", err); |
02c7a755 DM |
75 | } |
76 | ||
e1d367df DM |
77 | // Note: To debug early connection error use |
78 | // PROXMOX_DEBUG=1 ./target/release/proxmox-backup-proxy | |
79 | let debug = std::env::var("PROXMOX_DEBUG").is_ok(); | |
80 | ||
d01e2420 DM |
81 | let _ = public_auth_key(); // load with lazy_static |
82 | let _ = csrf_secret(); // load with lazy_static | |
83 | ||
02c7a755 | 84 | let mut config = ApiConfig::new( |
f9e3b110 | 85 | buildcfg::JS_DIR, &proxmox_backup::api2::ROUTER, RpcEnvironmentType::PUBLIC)?; |
02c7a755 | 86 | |
02c7a755 DM |
87 | config.add_alias("novnc", "/usr/share/novnc-pve"); |
88 | config.add_alias("extjs", "/usr/share/javascript/extjs"); | |
89 | config.add_alias("fontawesome", "/usr/share/fonts-font-awesome"); | |
90 | config.add_alias("xtermjs", "/usr/share/pve-xtermjs"); | |
abd4c4cb | 91 | config.add_alias("locale", "/usr/share/pbs-i18n"); |
02c7a755 | 92 | config.add_alias("widgettoolkit", "/usr/share/javascript/proxmox-widget-toolkit"); |
9c01e73c | 93 | config.add_alias("docs", "/usr/share/doc/proxmox-backup/html"); |
02c7a755 | 94 | |
2ab5acac DC |
95 | let mut indexpath = PathBuf::from(buildcfg::JS_DIR); |
96 | indexpath.push("index.hbs"); | |
97 | config.register_template("index", &indexpath)?; | |
01ca99da | 98 | config.register_template("console", "/usr/share/pve-xtermjs/index.html.hbs")?; |
2ab5acac | 99 | |
a68768cf TL |
100 | let mut commando_sock = server::CommandoSocket::new(server::our_ctrl_sock()); |
101 | ||
fe4cc5b1 | 102 | config.enable_file_log(buildcfg::API_ACCESS_LOG_FN, &mut commando_sock)?; |
8e7e2223 | 103 | |
02c7a755 DM |
104 | let rest_server = RestServer::new(config); |
105 | ||
6d1f61b2 DM |
106 | //openssl req -x509 -newkey rsa:4096 -keyout /etc/proxmox-backup/proxy.key -out /etc/proxmox-backup/proxy.pem -nodes |
107 | let key_path = configdir!("/proxy.key"); | |
108 | let cert_path = configdir!("/proxy.pem"); | |
109 | ||
62c74d77 | 110 | let mut acceptor = SslAcceptor::mozilla_intermediate_v5(SslMethod::tls()).unwrap(); |
6d1f61b2 DM |
111 | acceptor.set_private_key_file(key_path, SslFiletype::PEM) |
112 | .map_err(|err| format_err!("unable to read proxy key {} - {}", key_path, err))?; | |
113 | acceptor.set_certificate_chain_file(cert_path) | |
114 | .map_err(|err| format_err!("unable to read proxy cert {} - {}", cert_path, err))?; | |
115 | acceptor.check_private_key().unwrap(); | |
116 | ||
117 | let acceptor = Arc::new(acceptor.build()); | |
0d176f36 | 118 | |
a690ecac WB |
119 | let server = daemon::create_daemon( |
120 | ([0,0,0,0,0,0,0,0], 8007).into(), | |
083ff3fd | 121 | |listener, ready| { |
97168f92 | 122 | |
e1d367df | 123 | let connections = accept_connections(listener, acceptor, debug); |
48aa2b93 | 124 | let connections = hyper::server::accept::from_stream(connections); |
083ff3fd WB |
125 | |
126 | Ok(ready | |
48aa2b93 | 127 | .and_then(|_| hyper::Server::builder(connections) |
083ff3fd WB |
128 | .serve(rest_server) |
129 | .with_graceful_shutdown(server::shutdown_future()) | |
130 | .map_err(Error::from) | |
131 | ) | |
132 | .map_err(|err| eprintln!("server error: {}", err)) | |
133 | .map(|_| ()) | |
a690ecac | 134 | ) |
a2ca7137 | 135 | }, |
d7c6ad60 | 136 | "proxmox-backup-proxy.service", |
083ff3fd | 137 | ); |
a2ca7137 | 138 | |
04b053d8 | 139 | server::write_pid(buildcfg::PROXMOX_BACKUP_PROXY_PID_FN)?; |
d98c9a7a WB |
140 | daemon::systemd_notify(daemon::SystemdNotify::Ready)?; |
141 | ||
fda5797b | 142 | let init_result: Result<(), Error> = try_block!({ |
a68768cf TL |
143 | server::register_task_control_commands(&mut commando_sock)?; |
144 | commando_sock.spawn()?; | |
fda5797b WB |
145 | server::server_state_init()?; |
146 | Ok(()) | |
147 | }); | |
d607b886 | 148 | |
fda5797b WB |
149 | if let Err(err) = init_result { |
150 | bail!("unable to start daemon - {}", err); | |
151 | } | |
e3f41f21 | 152 | |
8545480a | 153 | start_task_scheduler(); |
eaeda365 | 154 | start_stat_generator(); |
8545480a | 155 | |
083ff3fd | 156 | server.await?; |
a546a8a0 WB |
157 | log::info!("server shutting down, waiting for active workers to complete"); |
158 | proxmox_backup::server::last_worker_future().await?; | |
fda5797b | 159 | log::info!("done - exit server"); |
e3f41f21 | 160 | |
4223d9f8 | 161 | Ok(()) |
02c7a755 | 162 | } |
8545480a | 163 | |
48aa2b93 DM |
164 | fn accept_connections( |
165 | mut listener: tokio::net::TcpListener, | |
166 | acceptor: Arc<openssl::ssl::SslAcceptor>, | |
e1d367df | 167 | debug: bool, |
48aa2b93 DM |
168 | ) -> tokio::sync::mpsc::Receiver<Result<tokio_openssl::SslStream<tokio::net::TcpStream>, Error>> { |
169 | ||
ea93bea7 | 170 | const MAX_PENDING_ACCEPTS: usize = 1024; |
48aa2b93 | 171 | |
ea93bea7 | 172 | let (sender, receiver) = tokio::sync::mpsc::channel(MAX_PENDING_ACCEPTS); |
48aa2b93 | 173 | |
ea93bea7 | 174 | let accept_counter = Arc::new(()); |
48aa2b93 DM |
175 | |
176 | tokio::spawn(async move { | |
177 | loop { | |
178 | match listener.accept().await { | |
179 | Err(err) => { | |
180 | eprintln!("error accepting tcp connection: {}", err); | |
181 | } | |
182 | Ok((sock, _addr)) => { | |
183 | sock.set_nodelay(true).unwrap(); | |
184 | let _ = set_tcp_keepalive(sock.as_raw_fd(), PROXMOX_BACKUP_TCP_KEEPALIVE_TIME); | |
185 | let acceptor = Arc::clone(&acceptor); | |
186 | let mut sender = sender.clone(); | |
187 | ||
71f413cd | 188 | if Arc::strong_count(&accept_counter) > MAX_PENDING_ACCEPTS { |
ea93bea7 | 189 | eprintln!("connection rejected - to many open connections"); |
48aa2b93 DM |
190 | continue; |
191 | } | |
48aa2b93 DM |
192 | |
193 | let accept_counter = accept_counter.clone(); | |
194 | tokio::spawn(async move { | |
195 | let accept_future = tokio::time::timeout( | |
196 | Duration::new(10, 0), tokio_openssl::accept(&acceptor, sock)); | |
197 | ||
198 | let result = accept_future.await; | |
199 | ||
200 | match result { | |
201 | Ok(Ok(connection)) => { | |
202 | if let Err(_) = sender.send(Ok(connection)).await { | |
e1d367df DM |
203 | if debug { |
204 | eprintln!("detect closed connection channel"); | |
205 | } | |
48aa2b93 DM |
206 | } |
207 | } | |
208 | Ok(Err(err)) => { | |
e1d367df DM |
209 | if debug { |
210 | eprintln!("https handshake failed - {}", err); | |
211 | } | |
48aa2b93 DM |
212 | } |
213 | Err(_) => { | |
e1d367df DM |
214 | if debug { |
215 | eprintln!("https handshake timeout"); | |
216 | } | |
48aa2b93 DM |
217 | } |
218 | } | |
219 | ||
71f413cd | 220 | drop(accept_counter); // decrease reference count |
48aa2b93 DM |
221 | }); |
222 | } | |
223 | } | |
224 | } | |
225 | }); | |
226 | ||
227 | receiver | |
228 | } | |
229 | ||
eaeda365 DM |
230 | fn start_stat_generator() { |
231 | let abort_future = server::shutdown_future(); | |
232 | let future = Box::pin(run_stat_generator()); | |
233 | let task = futures::future::select(future, abort_future); | |
234 | tokio::spawn(task.map(|_| ())); | |
235 | } | |
236 | ||
8545480a DM |
237 | fn start_task_scheduler() { |
238 | let abort_future = server::shutdown_future(); | |
239 | let future = Box::pin(run_task_scheduler()); | |
240 | let task = futures::future::select(future, abort_future); | |
241 | tokio::spawn(task.map(|_| ())); | |
242 | } | |
243 | ||
6a7be83e | 244 | use std::time::{SystemTime, Instant, Duration, UNIX_EPOCH}; |
8545480a DM |
245 | |
246 | fn next_minute() -> Result<Instant, Error> { | |
6a7be83e DM |
247 | let now = SystemTime::now(); |
248 | let epoch_now = now.duration_since(UNIX_EPOCH)?; | |
249 | let epoch_next = Duration::from_secs((epoch_now.as_secs()/60 + 1)*60); | |
8545480a DM |
250 | Ok(Instant::now() + epoch_next - epoch_now) |
251 | } | |
252 | ||
253 | async fn run_task_scheduler() { | |
254 | ||
255 | let mut count: usize = 0; | |
256 | ||
257 | loop { | |
258 | count += 1; | |
259 | ||
260 | let delay_target = match next_minute() { // try to run very minute | |
261 | Ok(d) => d, | |
262 | Err(err) => { | |
263 | eprintln!("task scheduler: compute next minute failed - {}", err); | |
264 | tokio::time::delay_until(tokio::time::Instant::from_std(Instant::now() + Duration::from_secs(60))).await; | |
265 | continue; | |
266 | } | |
267 | }; | |
268 | ||
269 | if count > 2 { // wait 1..2 minutes before starting | |
270 | match schedule_tasks().catch_unwind().await { | |
271 | Err(panic) => { | |
272 | match panic.downcast::<&str>() { | |
273 | Ok(msg) => { | |
274 | eprintln!("task scheduler panic: {}", msg); | |
275 | } | |
276 | Err(_) => { | |
277 | eprintln!("task scheduler panic - unknown type"); | |
278 | } | |
279 | } | |
280 | } | |
281 | Ok(Err(err)) => { | |
282 | eprintln!("task scheduler failed - {:?}", err); | |
283 | } | |
284 | Ok(Ok(_)) => {} | |
285 | } | |
286 | } | |
287 | ||
288 | tokio::time::delay_until(tokio::time::Instant::from_std(delay_target)).await; | |
289 | } | |
290 | } | |
291 | ||
292 | async fn schedule_tasks() -> Result<(), Error> { | |
293 | ||
294 | schedule_datastore_garbage_collection().await; | |
25829a87 | 295 | schedule_datastore_prune().await; |
a6160cdf | 296 | schedule_datastore_sync_jobs().await; |
73df9c51 | 297 | schedule_datastore_verify_jobs().await; |
9a760917 | 298 | schedule_task_log_rotate().await; |
8545480a DM |
299 | |
300 | Ok(()) | |
301 | } | |
302 | ||
8545480a DM |
303 | async fn schedule_datastore_garbage_collection() { |
304 | ||
b9e7bcc2 DM |
305 | use proxmox_backup::config::{ |
306 | datastore::{ | |
307 | self, | |
308 | DataStoreConfig, | |
309 | }, | |
d7a122a0 | 310 | }; |
8545480a | 311 | |
25829a87 | 312 | let config = match datastore::config() { |
8545480a DM |
313 | Err(err) => { |
314 | eprintln!("unable to read datastore config - {}", err); | |
315 | return; | |
316 | } | |
317 | Ok((config, _digest)) => config, | |
318 | }; | |
319 | ||
320 | for (store, (_, store_config)) in config.sections { | |
321 | let datastore = match DataStore::lookup_datastore(&store) { | |
322 | Ok(datastore) => datastore, | |
323 | Err(err) => { | |
324 | eprintln!("lookup_datastore failed - {}", err); | |
325 | continue; | |
326 | } | |
327 | }; | |
328 | ||
25829a87 | 329 | let store_config: DataStoreConfig = match serde_json::from_value(store_config) { |
8545480a DM |
330 | Ok(c) => c, |
331 | Err(err) => { | |
332 | eprintln!("datastore config from_value failed - {}", err); | |
333 | continue; | |
334 | } | |
335 | }; | |
336 | ||
337 | let event_str = match store_config.gc_schedule { | |
338 | Some(event_str) => event_str, | |
339 | None => continue, | |
340 | }; | |
341 | ||
342 | let event = match parse_calendar_event(&event_str) { | |
343 | Ok(event) => event, | |
344 | Err(err) => { | |
345 | eprintln!("unable to parse schedule '{}' - {}", event_str, err); | |
346 | continue; | |
347 | } | |
348 | }; | |
349 | ||
350 | if datastore.garbage_collection_running() { continue; } | |
351 | ||
352 | let worker_type = "garbage_collection"; | |
353 | ||
b6ba5acd DC |
354 | let last = match jobstate::last_run_time(worker_type, &store) { |
355 | Ok(time) => time, | |
356 | Err(err) => { | |
357 | eprintln!("could not get last run time of {} {}: {}", worker_type, store, err); | |
358 | continue; | |
8545480a DM |
359 | } |
360 | }; | |
361 | ||
362 | let next = match compute_next_event(&event, last, false) { | |
15ec790a DC |
363 | Ok(Some(next)) => next, |
364 | Ok(None) => continue, | |
8545480a DM |
365 | Err(err) => { |
366 | eprintln!("compute_next_event for '{}' failed - {}", event_str, err); | |
367 | continue; | |
368 | } | |
369 | }; | |
e693818a | 370 | |
6a7be83e DM |
371 | let now = proxmox::tools::time::epoch_i64(); |
372 | ||
8545480a DM |
373 | if next > now { continue; } |
374 | ||
1cd951c9 | 375 | let job = match Job::new(worker_type, &store) { |
d7a122a0 DC |
376 | Ok(job) => job, |
377 | Err(_) => continue, // could not get lock | |
378 | }; | |
379 | ||
ad54df31 | 380 | let auth_id = Authid::root_auth_id(); |
d7a122a0 | 381 | |
c724f658 | 382 | if let Err(err) = crate::server::do_garbage_collection_job(job, datastore, auth_id, Some(event_str), false) { |
3b707fbb | 383 | eprintln!("unable to start garbage collection job on datastore {} - {}", store, err); |
8545480a DM |
384 | } |
385 | } | |
386 | } | |
25829a87 DM |
387 | |
388 | async fn schedule_datastore_prune() { | |
389 | ||
1298618a DM |
390 | use proxmox_backup::{ |
391 | backup::{ | |
392 | PruneOptions, | |
1298618a DM |
393 | }, |
394 | config::datastore::{ | |
395 | self, | |
396 | DataStoreConfig, | |
397 | }, | |
9866de5e | 398 | }; |
25829a87 DM |
399 | |
400 | let config = match datastore::config() { | |
401 | Err(err) => { | |
402 | eprintln!("unable to read datastore config - {}", err); | |
403 | return; | |
404 | } | |
405 | Ok((config, _digest)) => config, | |
406 | }; | |
407 | ||
408 | for (store, (_, store_config)) in config.sections { | |
25829a87 DM |
409 | |
410 | let store_config: DataStoreConfig = match serde_json::from_value(store_config) { | |
411 | Ok(c) => c, | |
412 | Err(err) => { | |
a6160cdf | 413 | eprintln!("datastore '{}' config from_value failed - {}", store, err); |
25829a87 DM |
414 | continue; |
415 | } | |
416 | }; | |
417 | ||
418 | let event_str = match store_config.prune_schedule { | |
419 | Some(event_str) => event_str, | |
420 | None => continue, | |
421 | }; | |
422 | ||
423 | let prune_options = PruneOptions { | |
424 | keep_last: store_config.keep_last, | |
425 | keep_hourly: store_config.keep_hourly, | |
426 | keep_daily: store_config.keep_daily, | |
427 | keep_weekly: store_config.keep_weekly, | |
428 | keep_monthly: store_config.keep_monthly, | |
429 | keep_yearly: store_config.keep_yearly, | |
430 | }; | |
431 | ||
432 | if !prune_options.keeps_something() { // no prune settings - keep all | |
433 | continue; | |
434 | } | |
435 | ||
25829a87 | 436 | let worker_type = "prune"; |
b15751bf | 437 | if check_schedule(worker_type, &event_str, &store) { |
82c05b41 HL |
438 | let job = match Job::new(worker_type, &store) { |
439 | Ok(job) => job, | |
440 | Err(_) => continue, // could not get lock | |
441 | }; | |
25829a87 | 442 | |
ad54df31 | 443 | let auth_id = Authid::root_auth_id().clone(); |
82c05b41 HL |
444 | if let Err(err) = do_prune_job(job, prune_options, store.clone(), &auth_id, Some(event_str)) { |
445 | eprintln!("unable to start datastore prune job {} - {}", &store, err); | |
25829a87 DM |
446 | } |
447 | }; | |
25829a87 DM |
448 | } |
449 | } | |
a6160cdf DM |
450 | |
451 | async fn schedule_datastore_sync_jobs() { | |
452 | ||
1298618a DM |
453 | use proxmox_backup::config::sync::{ |
454 | self, | |
455 | SyncJobConfig, | |
a6160cdf DM |
456 | }; |
457 | ||
458 | let config = match sync::config() { | |
459 | Err(err) => { | |
460 | eprintln!("unable to read sync job config - {}", err); | |
461 | return; | |
462 | } | |
463 | Ok((config, _digest)) => config, | |
464 | }; | |
465 | ||
a6160cdf DM |
466 | for (job_id, (_, job_config)) in config.sections { |
467 | let job_config: SyncJobConfig = match serde_json::from_value(job_config) { | |
468 | Ok(c) => c, | |
469 | Err(err) => { | |
470 | eprintln!("sync job config from_value failed - {}", err); | |
471 | continue; | |
472 | } | |
473 | }; | |
474 | ||
475 | let event_str = match job_config.schedule { | |
476 | Some(ref event_str) => event_str.clone(), | |
477 | None => continue, | |
478 | }; | |
479 | ||
c67b1fa7 | 480 | let worker_type = "syncjob"; |
b15751bf | 481 | if check_schedule(worker_type, &event_str, &job_id) { |
82c05b41 HL |
482 | let job = match Job::new(worker_type, &job_id) { |
483 | Ok(job) => job, | |
484 | Err(_) => continue, // could not get lock | |
485 | }; | |
a6160cdf | 486 | |
ad54df31 | 487 | let auth_id = Authid::root_auth_id().clone(); |
82c05b41 HL |
488 | if let Err(err) = do_sync_job(job, job_config, &auth_id, Some(event_str)) { |
489 | eprintln!("unable to start datastore sync job {} - {}", &job_id, err); | |
a6160cdf DM |
490 | } |
491 | }; | |
a6160cdf DM |
492 | } |
493 | } | |
eaeda365 | 494 | |
73df9c51 | 495 | async fn schedule_datastore_verify_jobs() { |
1298618a DM |
496 | |
497 | use proxmox_backup::config::verify::{ | |
498 | self, | |
499 | VerificationJobConfig, | |
73df9c51 | 500 | }; |
1298618a | 501 | |
73df9c51 HL |
502 | let config = match verify::config() { |
503 | Err(err) => { | |
504 | eprintln!("unable to read verification job config - {}", err); | |
505 | return; | |
506 | } | |
507 | Ok((config, _digest)) => config, | |
508 | }; | |
509 | for (job_id, (_, job_config)) in config.sections { | |
510 | let job_config: VerificationJobConfig = match serde_json::from_value(job_config) { | |
511 | Ok(c) => c, | |
512 | Err(err) => { | |
513 | eprintln!("verification job config from_value failed - {}", err); | |
514 | continue; | |
515 | } | |
516 | }; | |
517 | let event_str = match job_config.schedule { | |
518 | Some(ref event_str) => event_str.clone(), | |
519 | None => continue, | |
520 | }; | |
82c05b41 | 521 | |
73df9c51 | 522 | let worker_type = "verificationjob"; |
ad54df31 | 523 | let auth_id = Authid::root_auth_id().clone(); |
b15751bf | 524 | if check_schedule(worker_type, &event_str, &job_id) { |
82c05b41 HL |
525 | let job = match Job::new(&worker_type, &job_id) { |
526 | Ok(job) => job, | |
527 | Err(_) => continue, // could not get lock | |
528 | }; | |
529 | if let Err(err) = do_verification_job(job, job_config, &auth_id, Some(event_str)) { | |
530 | eprintln!("unable to start datastore verification job {} - {}", &job_id, err); | |
73df9c51 HL |
531 | } |
532 | }; | |
73df9c51 HL |
533 | } |
534 | } | |
535 | ||
9a760917 | 536 | async fn schedule_task_log_rotate() { |
9a760917 DC |
537 | |
538 | let worker_type = "logrotate"; | |
72aa1834 | 539 | let job_id = "access-log_and_task-archive"; |
9a760917 | 540 | |
9a760917 DC |
541 | // schedule daily at 00:00 like normal logrotate |
542 | let schedule = "00:00"; | |
543 | ||
b15751bf | 544 | if !check_schedule(worker_type, schedule, job_id) { |
9a760917 DC |
545 | // if we never ran the rotation, schedule instantly |
546 | match jobstate::JobState::load(worker_type, job_id) { | |
547 | Ok(state) => match state { | |
548 | jobstate::JobState::Created { .. } => {}, | |
549 | _ => return, | |
550 | }, | |
551 | _ => return, | |
552 | } | |
553 | } | |
554 | ||
555 | let mut job = match Job::new(worker_type, job_id) { | |
556 | Ok(job) => job, | |
557 | Err(_) => return, // could not get lock | |
558 | }; | |
559 | ||
560 | if let Err(err) = WorkerTask::new_thread( | |
561 | worker_type, | |
72aa1834 | 562 | None, |
ad54df31 | 563 | Authid::root_auth_id().clone(), |
9a760917 DC |
564 | false, |
565 | move |worker| { | |
566 | job.start(&worker.upid().to_string())?; | |
567 | worker.log(format!("starting task log rotation")); | |
e4f5f59e | 568 | |
9a760917 | 569 | let result = try_block!({ |
b7f2be51 TL |
570 | let max_size = 512 * 1024 - 1; // an entry has ~ 100b, so > 5000 entries/file |
571 | let max_files = 20; // times twenty files gives > 100000 task entries | |
9a760917 DC |
572 | let has_rotated = rotate_task_log_archive(max_size, true, Some(max_files))?; |
573 | if has_rotated { | |
574 | worker.log(format!("task log archive was rotated")); | |
575 | } else { | |
576 | worker.log(format!("task log archive was not rotated")); | |
577 | } | |
578 | ||
fe4cc5b1 TL |
579 | let max_size = 32 * 1024 * 1024 - 1; |
580 | let max_files = 14; | |
581 | let mut logrotate = LogRotate::new(buildcfg::API_ACCESS_LOG_FN, true) | |
582 | .ok_or_else(|| format_err!("could not get API access log file names"))?; | |
583 | ||
fe7bdc9d | 584 | if logrotate.rotate(max_size, None, Some(max_files))? { |
fe4cc5b1 TL |
585 | println!("rotated access log, telling daemons to re-open log file"); |
586 | proxmox_backup::tools::runtime::block_on(command_reopen_logfiles())?; | |
fe7bdc9d TL |
587 | worker.log(format!("API access log was rotated")); |
588 | } else { | |
589 | worker.log(format!("API access log was not rotated")); | |
590 | } | |
591 | ||
592 | let mut logrotate = LogRotate::new(buildcfg::API_AUTH_LOG_FN, true) | |
593 | .ok_or_else(|| format_err!("could not get API auth log file names"))?; | |
fe4cc5b1 | 594 | |
fe7bdc9d | 595 | if logrotate.rotate(max_size, None, Some(max_files))? { |
0eb0c4bd | 596 | worker.log(format!("API authentication log was rotated")); |
fe4cc5b1 | 597 | } else { |
0eb0c4bd | 598 | worker.log(format!("API authentication log was not rotated")); |
fe4cc5b1 TL |
599 | } |
600 | ||
9a760917 DC |
601 | Ok(()) |
602 | }); | |
603 | ||
604 | let status = worker.create_state(&result); | |
605 | ||
606 | if let Err(err) = job.finish(status) { | |
607 | eprintln!("could not finish job state for {}: {}", worker_type, err); | |
608 | } | |
609 | ||
610 | result | |
611 | }, | |
612 | ) { | |
613 | eprintln!("unable to start task log rotation: {}", err); | |
614 | } | |
615 | ||
616 | } | |
617 | ||
fe4cc5b1 TL |
618 | async fn command_reopen_logfiles() -> Result<(), Error> { |
619 | // only care about the most recent daemon instance for each, proxy & api, as other older ones | |
620 | // should not respond to new requests anyway, but only finish their current one and then exit. | |
621 | let sock = server::our_ctrl_sock(); | |
546b6a23 | 622 | let f1 = server::send_command(sock, serde_json::json!({ |
fe4cc5b1 | 623 | "command": "api-access-log-reopen", |
546b6a23 | 624 | })); |
fe4cc5b1 TL |
625 | |
626 | let pid = server::read_pid(buildcfg::PROXMOX_BACKUP_API_PID_FN)?; | |
627 | let sock = server::ctrl_sock_from_pid(pid); | |
546b6a23 | 628 | let f2 = server::send_command(sock, serde_json::json!({ |
fe4cc5b1 | 629 | "command": "api-access-log-reopen", |
546b6a23 TL |
630 | })); |
631 | ||
632 | match futures::join!(f1, f2) { | |
633 | (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)), | |
634 | (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)), | |
635 | (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)), | |
636 | _ => Ok(()), | |
637 | } | |
fe4cc5b1 TL |
638 | } |
639 | ||
eaeda365 DM |
640 | async fn run_stat_generator() { |
641 | ||
013fa7bb | 642 | let mut count = 0; |
eaeda365 | 643 | loop { |
013fa7bb | 644 | count += 1; |
a720894f | 645 | let save = if count >= 6 { count = 0; true } else { false }; |
013fa7bb | 646 | |
eaeda365 DM |
647 | let delay_target = Instant::now() + Duration::from_secs(10); |
648 | ||
013fa7bb | 649 | generate_host_stats(save).await; |
eaeda365 DM |
650 | |
651 | tokio::time::delay_until(tokio::time::Instant::from_std(delay_target)).await; | |
013fa7bb DM |
652 | |
653 | } | |
eaeda365 DM |
654 | |
655 | } | |
656 | ||
013fa7bb | 657 | fn rrd_update_gauge(name: &str, value: f64, save: bool) { |
309ef20d | 658 | use proxmox_backup::rrd; |
013fa7bb | 659 | if let Err(err) = rrd::update_value(name, value, rrd::DST::Gauge, save) { |
309ef20d DM |
660 | eprintln!("rrd::update_value '{}' failed - {}", name, err); |
661 | } | |
662 | } | |
663 | ||
013fa7bb | 664 | fn rrd_update_derive(name: &str, value: f64, save: bool) { |
309ef20d | 665 | use proxmox_backup::rrd; |
013fa7bb | 666 | if let Err(err) = rrd::update_value(name, value, rrd::DST::Derive, save) { |
309ef20d DM |
667 | eprintln!("rrd::update_value '{}' failed - {}", name, err); |
668 | } | |
669 | } | |
670 | ||
013fa7bb | 671 | async fn generate_host_stats(save: bool) { |
8f0cec26 | 672 | use proxmox::sys::linux::procfs::{ |
485841da | 673 | read_meminfo, read_proc_stat, read_proc_net_dev, read_loadavg}; |
309ef20d | 674 | use proxmox_backup::config::datastore; |
8c03041a | 675 | |
eaeda365 | 676 | |
4f951399 DM |
677 | proxmox_backup::tools::runtime::block_in_place(move || { |
678 | ||
679 | match read_proc_stat() { | |
680 | Ok(stat) => { | |
013fa7bb DM |
681 | rrd_update_gauge("host/cpu", stat.cpu, save); |
682 | rrd_update_gauge("host/iowait", stat.iowait_percent, save); | |
4f951399 DM |
683 | } |
684 | Err(err) => { | |
685 | eprintln!("read_proc_stat failed - {}", err); | |
eaeda365 DM |
686 | } |
687 | } | |
2c66a590 | 688 | |
4f951399 DM |
689 | match read_meminfo() { |
690 | Ok(meminfo) => { | |
013fa7bb DM |
691 | rrd_update_gauge("host/memtotal", meminfo.memtotal as f64, save); |
692 | rrd_update_gauge("host/memused", meminfo.memused as f64, save); | |
693 | rrd_update_gauge("host/swaptotal", meminfo.swaptotal as f64, save); | |
694 | rrd_update_gauge("host/swapused", meminfo.swapused as f64, save); | |
a4a3f7ca | 695 | } |
4f951399 DM |
696 | Err(err) => { |
697 | eprintln!("read_meminfo failed - {}", err); | |
a4a3f7ca DM |
698 | } |
699 | } | |
8f0cec26 | 700 | |
4f951399 DM |
701 | match read_proc_net_dev() { |
702 | Ok(netdev) => { | |
703 | use proxmox_backup::config::network::is_physical_nic; | |
704 | let mut netin = 0; | |
705 | let mut netout = 0; | |
706 | for item in netdev { | |
707 | if !is_physical_nic(&item.device) { continue; } | |
708 | netin += item.receive; | |
709 | netout += item.send; | |
710 | } | |
013fa7bb DM |
711 | rrd_update_derive("host/netin", netin as f64, save); |
712 | rrd_update_derive("host/netout", netout as f64, save); | |
8f0cec26 | 713 | } |
4f951399 DM |
714 | Err(err) => { |
715 | eprintln!("read_prox_net_dev failed - {}", err); | |
8f0cec26 DM |
716 | } |
717 | } | |
dd15c0aa | 718 | |
485841da DM |
719 | match read_loadavg() { |
720 | Ok(loadavg) => { | |
013fa7bb | 721 | rrd_update_gauge("host/loadavg", loadavg.0 as f64, save); |
485841da DM |
722 | } |
723 | Err(err) => { | |
724 | eprintln!("read_loadavg failed - {}", err); | |
725 | } | |
726 | } | |
727 | ||
8c03041a DM |
728 | let disk_manager = DiskManage::new(); |
729 | ||
013fa7bb | 730 | gather_disk_stats(disk_manager.clone(), Path::new("/"), "host", save); |
91e5bb49 | 731 | |
d0833a70 DM |
732 | match datastore::config() { |
733 | Ok((config, _)) => { | |
734 | let datastore_list: Vec<datastore::DataStoreConfig> = | |
735 | config.convert_to_typed_array("datastore").unwrap_or(Vec::new()); | |
736 | ||
737 | for config in datastore_list { | |
8c03041a | 738 | |
91e5bb49 | 739 | let rrd_prefix = format!("datastore/{}", config.name); |
8c03041a | 740 | let path = std::path::Path::new(&config.path); |
013fa7bb | 741 | gather_disk_stats(disk_manager.clone(), path, &rrd_prefix, save); |
d0833a70 DM |
742 | } |
743 | } | |
744 | Err(err) => { | |
745 | eprintln!("read datastore config failed - {}", err); | |
746 | } | |
747 | } | |
748 | ||
4f951399 | 749 | }); |
eaeda365 | 750 | } |
dd15c0aa | 751 | |
b15751bf DM |
752 | fn check_schedule(worker_type: &str, event_str: &str, id: &str) -> bool { |
753 | let event = match parse_calendar_event(event_str) { | |
82c05b41 HL |
754 | Ok(event) => event, |
755 | Err(err) => { | |
756 | eprintln!("unable to parse schedule '{}' - {}", event_str, err); | |
757 | return false; | |
758 | } | |
759 | }; | |
760 | ||
b15751bf | 761 | let last = match jobstate::last_run_time(worker_type, &id) { |
82c05b41 HL |
762 | Ok(time) => time, |
763 | Err(err) => { | |
764 | eprintln!("could not get last run time of {} {}: {}", worker_type, id, err); | |
765 | return false; | |
766 | } | |
767 | }; | |
768 | ||
769 | let next = match compute_next_event(&event, last, false) { | |
770 | Ok(Some(next)) => next, | |
771 | Ok(None) => return false, | |
772 | Err(err) => { | |
773 | eprintln!("compute_next_event for '{}' failed - {}", event_str, err); | |
774 | return false; | |
775 | } | |
776 | }; | |
777 | ||
778 | let now = proxmox::tools::time::epoch_i64(); | |
779 | next <= now | |
780 | } | |
781 | ||
013fa7bb | 782 | fn gather_disk_stats(disk_manager: Arc<DiskManage>, path: &Path, rrd_prefix: &str, save: bool) { |
91e5bb49 | 783 | |
934f5bb8 | 784 | match proxmox_backup::tools::disks::disk_usage(path) { |
33070956 | 785 | Ok(status) => { |
91e5bb49 | 786 | let rrd_key = format!("{}/total", rrd_prefix); |
33070956 | 787 | rrd_update_gauge(&rrd_key, status.total as f64, save); |
91e5bb49 | 788 | let rrd_key = format!("{}/used", rrd_prefix); |
33070956 | 789 | rrd_update_gauge(&rrd_key, status.used as f64, save); |
91e5bb49 DM |
790 | } |
791 | Err(err) => { | |
792 | eprintln!("read disk_usage on {:?} failed - {}", path, err); | |
793 | } | |
794 | } | |
795 | ||
934f5bb8 DM |
796 | match disk_manager.find_mounted_device(path) { |
797 | Ok(None) => {}, | |
798 | Ok(Some((fs_type, device, source))) => { | |
799 | let mut device_stat = None; | |
800 | match fs_type.as_str() { | |
801 | "zfs" => { | |
802 | if let Some(pool) = source { | |
803 | match zfs_pool_stats(&pool) { | |
804 | Ok(stat) => device_stat = stat, | |
805 | Err(err) => eprintln!("zfs_pool_stats({:?}) failed - {}", pool, err), | |
91e5bb49 DM |
806 | } |
807 | } | |
934f5bb8 DM |
808 | } |
809 | _ => { | |
810 | if let Ok(disk) = disk_manager.clone().disk_by_dev_num(device.into_dev_t()) { | |
811 | match disk.read_stat() { | |
812 | Ok(stat) => device_stat = stat, | |
813 | Err(err) => eprintln!("disk.read_stat {:?} failed - {}", path, err), | |
91e5bb49 DM |
814 | } |
815 | } | |
816 | } | |
91e5bb49 | 817 | } |
934f5bb8 DM |
818 | if let Some(stat) = device_stat { |
819 | let rrd_key = format!("{}/read_ios", rrd_prefix); | |
820 | rrd_update_derive(&rrd_key, stat.read_ios as f64, save); | |
821 | let rrd_key = format!("{}/read_bytes", rrd_prefix); | |
822 | rrd_update_derive(&rrd_key, (stat.read_sectors*512) as f64, save); | |
dd15c0aa | 823 | |
934f5bb8 DM |
824 | let rrd_key = format!("{}/write_ios", rrd_prefix); |
825 | rrd_update_derive(&rrd_key, stat.write_ios as f64, save); | |
826 | let rrd_key = format!("{}/write_bytes", rrd_prefix); | |
827 | rrd_update_derive(&rrd_key, (stat.write_sectors*512) as f64, save); | |
dd15c0aa | 828 | |
934f5bb8 DM |
829 | let rrd_key = format!("{}/io_ticks", rrd_prefix); |
830 | rrd_update_derive(&rrd_key, (stat.io_ticks as f64)/1000.0, save); | |
8c03041a DM |
831 | } |
832 | } | |
934f5bb8 DM |
833 | Err(err) => { |
834 | eprintln!("find_mounted_device failed - {}", err); | |
835 | } | |
8c03041a | 836 | } |
8c03041a | 837 | } |