cctools
|
Statistics describing a work queue. More...
#include <work_queue.h>
Data Fields | |
int | total_workers_connected |
Total number of workers currently connected to the master. More... | |
int | workers_init |
Number of workers initializing. More... | |
int | workers_idle |
Number of workers that are not running a task. More... | |
int | workers_busy |
Number of workers that are running at least one task. More... | |
int | total_workers_joined |
Total number of worker connections that were established to the master. More... | |
int | total_workers_removed |
Total number of worker connections that were terminated by the master. More... | |
int | tasks_waiting |
Number of tasks waiting to be run. More... | |
int | tasks_running |
Number of tasks currently running. More... | |
int | tasks_complete |
Number of tasks waiting to be returned to user. More... | |
int | total_tasks_dispatched |
Total number of tasks dispatched to workers. More... | |
int | total_tasks_complete |
Total number of tasks completed and returned to user. More... | |
int | total_tasks_failed |
Total number of tasks completed and returned to user with result other than WQ_RESULT_SUCCESS. More... | |
int | total_tasks_cancelled |
Total number of tasks cancelled. More... | |
timestamp_t | start_time |
Absolute time at which the master started. More... | |
timestamp_t | total_send_time |
Total time in microseconds spent in sending data to workers. More... | |
timestamp_t | total_receive_time |
Total time in microseconds spent in receiving data from workers. More... | |
timestamp_t | total_good_transfer_time |
Total time in microseconds spent sending data to and receiving data from workers for tasks with result WQ_RESULT_SUCCESS. More... | |
timestamp_t | total_execute_time |
Total time in microseconds workers spent executing completed tasks. More... | |
timestamp_t | total_good_execute_time |
Total time in microseconds workers spent executing successful tasks. More... | |
int64_t | total_bytes_sent |
Total number of file bytes (not including protocol control msg bytes) sent out to the workers by the master. More... | |
int64_t | total_bytes_received |
Total number of file bytes (not including protocol control msg bytes) received from the workers by the master. More... | |
double | efficiency |
Parallel efficiency of the system: sum(task execution times) / sum(worker lifetimes). More... | |
double | idle_percentage |
The fraction of time that the master is idle waiting for workers to respond. More... | |
int | capacity |
The estimated number of workers that this master can effectively support. More... | |
double | bandwidth |
Average network bandwidth in MB/s observed by the master when transferring to workers. More... | |
int64_t | total_cores |
Total number of cores aggregated across the connected workers. More... | |
int64_t | total_memory |
Total memory in MB aggregated across the connected workers. More... | |
int64_t | total_disk |
Total disk space in MB aggregated across the connected workers. More... | |
int64_t | total_gpus |
Total number of GPUs aggregated across the connected workers. More... | |
int64_t | committed_cores |
Committed number of cores aggregated across the connected workers. More... | |
int64_t | committed_memory |
Committed memory in MB aggregated across the connected workers. More... | |
int64_t | committed_disk |
Committed disk space in MB aggregated across the connected workers. More... | |
int64_t | committed_gpus |
Committed number of GPUs aggregated across the connected workers. More... | |
int64_t | min_cores |
The lowest number of cores observed among the connected workers. More... | |
int64_t | max_cores |
The highest number of cores observed among the connected workers. More... | |
int64_t | min_memory |
The smallest memory size in MB observed among the connected workers. More... | |
int64_t | max_memory |
The largest memory size in MB observed among the connected workers. More... | |
int64_t | min_disk |
The smallest disk space in MB observed among the connected workers. More... | |
int64_t | max_disk |
The largest disk space in MB observed among the connected workers. More... | |
int64_t | min_gpus |
The lowest number of GPUs observed among the connected workers. More... | |
int64_t | max_gpus |
The highest number of GPUs observed among the connected workers. More... | |
int | workers_ready |
int | workers_full |
int | total_worker_slots |
int | avg_capacity |
Statistics describing a work queue.
int work_queue_stats::total_workers_connected |
Total number of workers currently connected to the master.
int work_queue_stats::workers_init |
Number of workers initializing.
int work_queue_stats::workers_idle |
Number of workers that are not running a task.
int work_queue_stats::workers_busy |
Number of workers that are running at least one task.
int work_queue_stats::total_workers_joined |
Total number of worker connections that were established to the master.
int work_queue_stats::total_workers_removed |
Total number of worker connections that were terminated by the master.
int work_queue_stats::tasks_waiting |
Number of tasks waiting to be run.
int work_queue_stats::tasks_running |
Number of tasks currently running.
int work_queue_stats::tasks_complete |
Number of tasks waiting to be returned to user.
int work_queue_stats::total_tasks_dispatched |
Total number of tasks dispatched to workers.
int work_queue_stats::total_tasks_complete |
Total number of tasks completed and returned to user.
int work_queue_stats::total_tasks_failed |
Total number of tasks completed and returned to user with result other than WQ_RESULT_SUCCESS.
int work_queue_stats::total_tasks_cancelled |
Total number of tasks cancelled.
timestamp_t work_queue_stats::start_time |
Absolute time at which the master started.
timestamp_t work_queue_stats::total_send_time |
Total time in microseconds spent in sending data to workers.
timestamp_t work_queue_stats::total_receive_time |
Total time in microseconds spent in receiving data from workers.
timestamp_t work_queue_stats::total_good_transfer_time |
Total time in microseconds spent sending data to and receiving data from workers for tasks with result WQ_RESULT_SUCCESS.
timestamp_t work_queue_stats::total_execute_time |
Total time in microseconds workers spent executing completed tasks.
timestamp_t work_queue_stats::total_good_execute_time |
Total time in microseconds workers spent executing successful tasks.
int64_t work_queue_stats::total_bytes_sent |
Total number of file bytes (not including protocol control msg bytes) sent out to the workers by the master.
int64_t work_queue_stats::total_bytes_received |
Total number of file bytes (not including protocol control msg bytes) received from the workers by the master.
double work_queue_stats::efficiency |
Parallel efficiency of the system: sum(task execution times) / sum(worker lifetimes).
double work_queue_stats::idle_percentage |
The fraction of time that the master is idle waiting for workers to respond.
int work_queue_stats::capacity |
The estimated number of workers that this master can effectively support.
double work_queue_stats::bandwidth |
Average network bandwidth in MB/s observed by the master when transferring to workers.
int64_t work_queue_stats::total_cores |
Total number of cores aggregated across the connected workers.
int64_t work_queue_stats::total_memory |
Total memory in MB aggregated across the connected workers.
int64_t work_queue_stats::total_disk |
Total disk space in MB aggregated across the connected workers.
int64_t work_queue_stats::total_gpus |
Total number of GPUs aggregated across the connected workers.
int64_t work_queue_stats::committed_cores |
Committed number of cores aggregated across the connected workers.
int64_t work_queue_stats::committed_memory |
Committed memory in MB aggregated across the connected workers.
int64_t work_queue_stats::committed_disk |
Committed disk space in MB aggregated across the connected workers.
int64_t work_queue_stats::committed_gpus |
Committed number of GPUs aggregated across the connected workers.
int64_t work_queue_stats::min_cores |
The lowest number of cores observed among the connected workers.
int64_t work_queue_stats::max_cores |
The highest number of cores observed among the connected workers.
int64_t work_queue_stats::min_memory |
The smallest memory size in MB observed among the connected workers.
int64_t work_queue_stats::max_memory |
The largest memory size in MB observed among the connected workers.
int64_t work_queue_stats::min_disk |
The smallest disk space in MB observed among the connected workers.
int64_t work_queue_stats::max_disk |
The largest disk space in MB observed among the connected workers.
int64_t work_queue_stats::min_gpus |
The lowest number of GPUs observed among the connected workers.
int64_t work_queue_stats::max_gpus |
The highest number of GPUs observed among the connected workers.
int work_queue_stats::workers_ready |
int work_queue_stats::workers_full |
int work_queue_stats::total_worker_slots |
int work_queue_stats::avg_capacity |