/*****************************************************************************\
* job_report_functions.c - Interface to functions dealing with job reports.
******************************************************************************
* Copyright (C) 2010 Lawrence Livermore National Security.
* Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
* Written by Danny Auble da@llnl.gov, et. al.
* CODE-OCEC-09-009. All rights reserved.
*
* This file is part of Slurm, a resource management program.
* For details, see <https://slurm.schedmd.com/>.
* Please also read the included file: DISCLAIMER.
*
* Slurm is free software; you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* In addition, as a special exception, the copyright holders give permission
* to link the code of portions of this program with the OpenSSL library under
* certain conditions as described in each individual source file, and
* distribute linked combinations including the two. You must obey the GNU
* General Public License in all respects for all of the code used other than
* OpenSSL. If you modify file(s) with this exception, you may extend this
* exception to your version of the file(s), but you are not obligated to do
* so. If you do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source files in
* the program, then also delete it here.
*
* Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along
* with Slurm; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
\*****************************************************************************/
#include
#include "slurm/slurm.h"
#include "slurm/slurm_errno.h"
#include "slurm/slurmdb.h"
#include "src/common/slurm_accounting_storage.h"
#include "src/common/xstring.h"
/*
 * Comparator that orders grouping strings by their numeric value,
 * smallest first.
 *
 * IN v1, v2 - each points at a (char *) holding a decimal size string
 * RET -1 when v1 sorts before v2, 1 when it sorts after, 0 when equal
 */
static int _sort_group_asc(void *v1, void *v2)
{
	char **lhs = v1;
	char **rhs = v2;
	int lhs_size = atoi(*lhs);
	int rhs_size = atoi(*rhs);

	/* (a > b) - (a < b) evaluates to exactly -1, 0 or 1 */
	return (lhs_size > rhs_size) - (lhs_size < rhs_size);
}
/*
 * Make sure cluster_list holds a cluster grouping for "cluster" which in
 * turn holds an account grouping called "name", creating whichever of the
 * two is missing.
 *
 * A newly created account grouping gets one job grouping per string
 * returned by group_itr:
 *   - individual:  each group covers exactly the listed size
 *   - otherwise:   each group covers [previous size, listed size - 1], and
 *                  one extra group [last size, INFINITE] is appended when
 *                  the last size is non-zero
 *
 * IN/OUT cluster_list - list of slurmdb_report_cluster_grouping_t
 * IN group_itr - iterator over the size strings; walked to its end and
 *                reset only when a new account grouping is built
 * IN cluster - cluster name to find or add
 * IN name - account grouping name to find or add
 * IN object - slurmdb_wckey_rec_t when wckey_type is set, otherwise
 *             slurmdb_assoc_rec_t; only read when a grouping is created
 * IN individual - selects how the size bounds are filled in (see above)
 * IN wckey_type - selects how "object" is interpreted
 */
static void _check_create_grouping(
	List cluster_list, ListIterator group_itr,
	char *cluster, char *name, void *object,
	bool individual, bool wckey_type)
{
	slurmdb_report_cluster_grouping_t *cluster_rec = NULL;
	slurmdb_report_acct_grouping_t *acct_rec = NULL;
	slurmdb_report_job_grouping_t *size_rec = NULL;
	ListIterator search_itr;
	uint32_t prev_size = 0;
	char *size_str = NULL;

	/* find the cluster, adding it if this is the first time we see it */
	search_itr = list_iterator_create(cluster_list);
	while ((cluster_rec = list_next(search_itr))) {
		if (xstrcmp(cluster, cluster_rec->cluster) == 0)
			break;
	}
	list_iterator_destroy(search_itr);

	if (cluster_rec == NULL) {
		cluster_rec = xmalloc(
			sizeof(slurmdb_report_cluster_grouping_t));
		cluster_rec->cluster = xstrdup(cluster);
		cluster_rec->acct_list = list_create(
			slurmdb_destroy_report_acct_grouping);
		list_append(cluster_list, cluster_rec);
	}

	/* nothing more to do when the account grouping already exists */
	search_itr = list_iterator_create(cluster_rec->acct_list);
	while ((acct_rec = list_next(search_itr))) {
		if (xstrcmp(name, acct_rec->acct) == 0)
			break;
	}
	list_iterator_destroy(search_itr);

	if (acct_rec != NULL)
		return;

	acct_rec = xmalloc(sizeof(slurmdb_report_acct_grouping_t));
	acct_rec->acct = xstrdup(name);
	if (wckey_type) {
		slurmdb_wckey_rec_t *wckey_rec = object;

		/* a wckey stores its id in lft; rgt is left untouched */
		acct_rec->lft = wckey_rec->id;
	} else {
		slurmdb_assoc_rec_t *assoc_rec = object;

		acct_rec->lft = assoc_rec->lft;
		acct_rec->rgt = assoc_rec->rgt;
	}
	acct_rec->groups = list_create(slurmdb_destroy_report_job_grouping);
	list_append(cluster_rec->acct_list, acct_rec);

	while ((size_str = list_next(group_itr))) {
		uint32_t this_size = atoi(size_str);

		size_rec = xmalloc(sizeof(slurmdb_report_job_grouping_t));
		size_rec->jobs = list_create(NULL);
		if (individual) {
			size_rec->min_size = this_size;
			size_rec->max_size = this_size;
		} else {
			size_rec->min_size = prev_size;
			size_rec->max_size = this_size - 1;
		}
		prev_size = this_size;
		list_append(acct_rec->groups, size_rec);
	}

	/* open-ended group for everything at or above the last size */
	if (prev_size && !individual) {
		size_rec = xmalloc(sizeof(slurmdb_report_job_grouping_t));
		size_rec->jobs = list_create(NULL);
		size_rec->min_size = prev_size;
		size_rec->max_size = INFINITE;
		list_append(acct_rec->groups, size_rec);
	}

	/* leave the shared iterator ready for the next caller */
	list_iterator_reset(group_itr);
}
/*
 * Build a report of jobs bucketed by allocated CPU count, laid out as
 * cluster grouping -> account grouping -> job size grouping.
 *
 * FIXME: This only works for CPUS now
 *
 * IN db_conn - passed straight through to the accounting storage calls
 * IN/OUT job_cond - job filter. When NULL an empty condition is allocated
 *	for the duration of the call and destroyed before returning.
 *	JOBCOND_FLAG_DUP is OR'd into flags and db_flags is overwritten with
 *	SLURMDB_JOB_FLAG_NOTSET. When acct_as_parent is set and acct_list
 *	is missing or empty, acct_list is replaced by a list holding "root".
 * IN/OUT grouping_list - list of decimal size strings.
 *	NULL:  a temporary list "50,250,500,1000" is used.
 *	Empty: one entry per distinct CPU count found in the jobs is appended
 *	       (sorted ascending) and every group covers exactly one size.
 * IN flat_view - when set, no associations/wckeys are looked up; cluster
 *	and account groupings are created on demand from the jobs and matched
 *	by name. When clear, groupings come only from the association/wckey
 *	lookup and jobs that match none of them are skipped.
 * IN wckey_type - group by wckey instead of by account
 * IN both - group by the pair, named "<first>:<second>"
 * IN acct_as_parent - use job_cond->acct_list as the parent accounts of the
 *	associations to fetch rather than as the accounts themselves
 * RET list of slurmdb_report_cluster_grouping_t with the groupings that
 *	received no job removed, or NULL if the job query failed.
 *
 * NOTE: job_list is not destroyed here; pointers to its job records are
 * stored in every job_group->jobs list of the returned structure.
 */
static List _process_grouped_report(
	void *db_conn, slurmdb_job_cond_t *job_cond, List grouping_list,
	bool flat_view, bool wckey_type, bool both, bool acct_as_parent)
{
	int exit_code = 0;
	void *object = NULL, *object2 = NULL;
	ListIterator itr = NULL, itr2 = NULL;
	ListIterator cluster_itr = NULL;
	ListIterator local_itr = NULL;
	ListIterator acct_itr = NULL;
	ListIterator group_itr = NULL;
	slurmdb_job_rec_t *job = NULL;
	slurmdb_report_cluster_grouping_t *cluster_group = NULL;
	slurmdb_report_acct_grouping_t *acct_group = NULL;
	slurmdb_report_job_grouping_t *job_group = NULL;
	List job_list = NULL;
	List cluster_list = NULL;
	List object_list = NULL, object2_list = NULL;
	List tmp_acct_list = NULL;
	bool destroy_job_cond = false;
	bool destroy_grouping_list = false;
	bool individual = false;
	uint32_t tres_id = TRES_CPU;
	uid_t my_uid = getuid();

	if (!job_cond) {
		destroy_job_cond = true;
		job_cond = xmalloc(sizeof(slurmdb_job_cond_t));
	}
	if (!grouping_list) {
		destroy_grouping_list = true;
		grouping_list = list_create(xfree_ptr);
		slurm_addto_char_list(grouping_list, "50,250,500,1000");
	}

	/*
	 * We don't want to actually query by accounts in the jobs here since
	 * we may be looking for sub accounts of a specific account, so the
	 * account list is set aside for the duration of the job query.
	 */
	if (!flat_view) {
		tmp_acct_list = job_cond->acct_list;
		job_cond->acct_list = NULL;
	}

	job_cond->flags |= JOBCOND_FLAG_DUP;
	job_cond->db_flags = SLURMDB_JOB_FLAG_NOTSET;

	job_list = jobacct_storage_g_get_jobs_cond(db_conn, my_uid, job_cond);

	if (!flat_view) {
		job_cond->acct_list = tmp_acct_list;
		tmp_acct_list = NULL;
	}

	if (!job_list) {
		exit_code = 1;
		fprintf(stderr, " Problem with job query.\n");
		goto end_it;
	}

	group_itr = list_iterator_create(grouping_list);
	/* make a group for each job size we find. */
	if (!list_count(grouping_list)) {
		char *group = NULL;

		individual = true;
		itr = list_iterator_create(job_list);
		while ((job = list_next(itr))) {
			char *tmp = NULL;
			uint64_t count;

			if (!job->elapsed)
				continue;

			if ((count = slurmdb_find_tres_count_in_string(
				     job->tres_alloc_str, tres_id))
			    == INFINITE64)
				continue;

			tmp = xstrdup_printf("%"PRIu64, count);

			/* only add sizes we have not already recorded */
			while ((group = list_next(group_itr))) {
				if (!xstrcmp(group, tmp)) {
					break;
				}
			}

			if (!group)
				list_append(grouping_list, tmp);
			else
				xfree(tmp);

			list_iterator_reset(group_itr);
		}
		list_iterator_destroy(itr);
		list_sort(grouping_list, (ListCmpF)_sort_group_asc);
	}

	cluster_list = list_create(slurmdb_destroy_report_cluster_grouping);

	cluster_itr = list_iterator_create(cluster_list);

	if (flat_view)
		goto no_objects;

	if (!wckey_type || both) {
		slurmdb_assoc_cond_t assoc_cond;

		memset(&assoc_cond, 0, sizeof(slurmdb_assoc_cond_t));
		assoc_cond.id_list = job_cond->associd_list;
		assoc_cond.cluster_list = job_cond->cluster_list;
		/*
		 * partition_list is deliberately left unset: don't limit
		 * associations to having the partition_list.
		 */

		if (acct_as_parent) {
			/*
			 * Behave like an 'ls', will ask for the subaccounts of
			 * the requested account ("root" if none was given).
			 */
			if (!job_cond->acct_list ||
			    !list_count(job_cond->acct_list)) {
				FREE_NULL_LIST(job_cond->acct_list);
				job_cond->acct_list = list_create(NULL);
				list_append(job_cond->acct_list, "root");
			}
			assoc_cond.parent_acct_list = job_cond->acct_list;
		} else {
			/* Ask strictly for these accounts. */
			if (job_cond->acct_list &&
			    list_count(job_cond->acct_list))
				assoc_cond.acct_list = job_cond->acct_list;
		}
		object_list = acct_storage_g_get_assocs(db_conn, my_uid,
							&assoc_cond);
	}

	if (wckey_type || both) {
		slurmdb_wckey_cond_t wckey_cond;

		memset(&wckey_cond, 0, sizeof(slurmdb_wckey_cond_t));
		wckey_cond.name_list = job_cond->wckey_list;
		wckey_cond.cluster_list = job_cond->cluster_list;

		object2_list = acct_storage_g_get_wckeys(db_conn, my_uid,
							 &wckey_cond);
		/* with no association list the wckeys become the primary */
		if (!object_list) {
			object_list = object2_list;
			object2_list = NULL;
		}
	}

	if (!object_list) {
		debug2(" No join list given.\n");
		goto no_objects;
	}

	itr = list_iterator_create(object_list);
	if (object2_list)
		itr2 = list_iterator_create(object2_list);

	while ((object = list_next(itr))) {
		char *cluster = NULL;
		slurmdb_wckey_rec_t *wckey = (slurmdb_wckey_rec_t *)object;
		slurmdb_assoc_rec_t *assoc =
			(slurmdb_assoc_rec_t *)object;

		if (!itr2) {
			char *name = NULL;

			if (wckey_type) {
				cluster = wckey->cluster;
				name = wckey->name;
			} else {
				cluster = assoc->cluster;
				name = assoc->acct;
			}
			_check_create_grouping(cluster_list, group_itr,
					       cluster, name, object,
					       individual, wckey_type);
			continue;
		}

		/* pair this object with every object2 on the same cluster */
		while ((object2 = list_next(itr2))) {
			slurmdb_wckey_rec_t *wckey2 =
				(slurmdb_wckey_rec_t *)object2;
			slurmdb_assoc_rec_t *assoc2 =
				(slurmdb_assoc_rec_t *)object2;
			char name[200];

			if (!wckey_type) {
				if (xstrcmp(assoc->cluster, wckey2->cluster))
					continue;
				cluster = assoc->cluster;
				snprintf(name, sizeof(name), "%s:%s",
					 assoc->acct, wckey2->name);
			} else {
				/*
				 * NOTE(review): when itr2 exists, object_list
				 * appears to hold associations and
				 * object2_list wckeys, so the casts used in
				 * this branch look suspect. No caller in this
				 * file passes wckey_type together with both
				 * - confirm before relying on it.
				 */
				if (xstrcmp(wckey->cluster, assoc2->cluster))
					continue;
				cluster = wckey->cluster;
				snprintf(name, sizeof(name), "%s:%s",
					 wckey2->name, assoc->acct);
			}

			_check_create_grouping(cluster_list, group_itr,
					       cluster, name, object,
					       individual, wckey_type);
		}
		list_iterator_reset(itr2);
	}
	list_iterator_destroy(itr);
	if (itr2)
		list_iterator_destroy(itr2);

no_objects:
	itr = list_iterator_create(job_list);

	while ((job = list_next(itr))) {
		char *local_cluster = "UNKNOWN";
		char tmp_acct[200];
		uint64_t count;

		if (!job->elapsed) {
			/* here we don't care about jobs that didn't
			 * really run here */
			continue;
		}
		if (job->cluster)
			local_cluster = job->cluster;

		/* name under which this job is filed in a name based match */
		if (!wckey_type) {
			if (both && job->wckey) {
				snprintf(tmp_acct, sizeof(tmp_acct),
					 "%s:%s",
					 job->account,
					 job->wckey);
			} else {
				snprintf(tmp_acct, sizeof(tmp_acct),
					 "%s", job->account);
			}
		} else {
			if (both && job->account) {
				snprintf(tmp_acct, sizeof(tmp_acct),
					 "%s:%s",
					 job->wckey,
					 job->account);
			} else {
				snprintf(tmp_acct, sizeof(tmp_acct),
					 "%s", job->wckey);
			}
		}

		list_iterator_reset(cluster_itr);
		while ((cluster_group = list_next(cluster_itr))) {
			if (!xstrcmp(local_cluster, cluster_group->cluster))
				break;
		}
		if (!cluster_group) {
			/* here we are only looking for groups that
			 * were added with the associations above
			 */
			if (!flat_view)
				continue;
			cluster_group = xmalloc(
				sizeof(slurmdb_report_cluster_grouping_t));
			cluster_group->cluster = xstrdup(local_cluster);
			cluster_group->acct_list = list_create(
				slurmdb_destroy_report_acct_grouping);
			list_append(cluster_list, cluster_group);
		}

		acct_itr = list_iterator_create(cluster_group->acct_list);
		while ((acct_group = list_next(acct_itr))) {
			if (wckey_type) {
				if (!xstrcmp(tmp_acct, acct_group->acct))
					break;
				continue;
			}

			if (!flat_view
			    && (acct_group->lft != NO_VAL)
			    && (job->lft != NO_VAL)) {
				/* keep separate since we don't want
				 * to do a xstrcmp if we don't have to
				 */
				if (job->lft > acct_group->lft
				    && job->lft < acct_group->rgt) {
					char *mywckey = NULL;

					if (!both)
						break;

					/* wckey part of "acct:wckey" */
					if (acct_group->acct) {
						if ((mywckey = strstr(
							     acct_group->acct,
							     ":")))
							mywckey++;
					}

					if (!job->wckey && !mywckey)
						break;
					else if (!mywckey || !job->wckey)
						continue;
					else if (!xstrcmp(mywckey, job->wckey))
						break;
				}
			} else if (!xstrcmp(acct_group->acct, tmp_acct))
				break;
		}
		list_iterator_destroy(acct_itr);

		if (!acct_group) {
			char *group = NULL;
			uint32_t last_size = 0;

			/* here we are only looking for groups that
			 * were added with the associations above
			 */
			if (!flat_view)
				continue;

			acct_group = xmalloc(
				sizeof(slurmdb_report_acct_grouping_t));
			acct_group->acct = xstrdup(tmp_acct);
			acct_group->groups = list_create(
				slurmdb_destroy_report_job_grouping);
			list_append(cluster_group->acct_list, acct_group);

			while ((group = list_next(group_itr))) {
				job_group = xmalloc(
					sizeof(slurmdb_report_job_grouping_t));
				job_group->jobs = list_create(NULL);
				if (!individual)
					job_group->min_size = last_size;
				last_size = atoi(group);
				if (!individual)
					job_group->max_size = last_size-1;
				else
					job_group->min_size =
						job_group->max_size = last_size;
				list_append(acct_group->groups, job_group);
			}
			/* open-ended group above the last listed size */
			if (last_size && !individual) {
				job_group = xmalloc(
					sizeof(slurmdb_report_job_grouping_t));
				job_group->jobs = list_create(NULL);
				job_group->min_size = last_size;
				job_group->max_size = INFINITE;
				list_append(acct_group->groups, job_group);
			}
			list_iterator_reset(group_itr);
		}

		/*
		 * The job's size does not depend on the group being looked
		 * at, so work it out once instead of once per group.
		 */
		count = slurmdb_find_tres_count_in_string(
			job->tres_alloc_str, tres_id);
		if (count == INFINITE64)
			continue;

		local_itr = list_iterator_create(acct_group->groups);
		while ((job_group = list_next(local_itr))) {
			if ((count < job_group->min_size) ||
			    (count > job_group->max_size))
				continue;

			list_append(job_group->jobs, job);
			job_group->count++;
			acct_group->count++;
			cluster_group->count++;

			slurmdb_transfer_tres_time(
				&job_group->tres_list, job->tres_alloc_str,
				job->elapsed);
			slurmdb_transfer_tres_time(
				&acct_group->tres_list, job->tres_alloc_str,
				job->elapsed);
			slurmdb_transfer_tres_time(
				&cluster_group->tres_list, job->tres_alloc_str,
				job->elapsed);
		}
		list_iterator_destroy(local_itr);
	}
	list_iterator_destroy(itr);
	list_iterator_destroy(group_itr);

	/* drop every cluster and account grouping that received no job */
	list_iterator_reset(cluster_itr);
	while ((cluster_group = list_next(cluster_itr))) {
		if (!cluster_group->count) {
			list_delete_item(cluster_itr);
			continue;
		}
		acct_itr = list_iterator_create(cluster_group->acct_list);
		while ((acct_group = list_next(acct_itr))) {
			if (!acct_group->count)
				list_delete_item(acct_itr);
		}
		list_iterator_destroy(acct_itr);
	}
	list_iterator_destroy(cluster_itr);

end_it:
	FREE_NULL_LIST(object_list);

	FREE_NULL_LIST(object2_list);

	if (destroy_job_cond)
		slurmdb_destroy_job_cond(job_cond);

	if (destroy_grouping_list)
		FREE_NULL_LIST(grouping_list);

	if (exit_code) {
		FREE_NULL_LIST(cluster_list);
	}

	return cluster_list;
}
/*
 * Report job sizes grouped by account.
 *
 * Forwards to _process_grouped_report() with both the wckey_type and the
 * "both" flags cleared; every other argument is passed through unchanged.
 *
 * RET whatever _process_grouped_report() returns
 */
extern List slurmdb_report_job_sizes_grouped_by_account(
	void *db_conn, slurmdb_job_cond_t *job_cond, List grouping_list,
	bool flat_view, bool acct_as_parent)
{
	const bool wckey_type = false;
	const bool both = false;

	return _process_grouped_report(db_conn, job_cond, grouping_list,
				       flat_view, wckey_type, both,
				       acct_as_parent);
}
/*
 * Report job sizes grouped by wckey.
 *
 * Forwards to _process_grouped_report() with wckey_type set and with
 * flat_view, "both" and acct_as_parent all cleared.
 *
 * RET whatever _process_grouped_report() returns
 */
extern List slurmdb_report_job_sizes_grouped_by_wckey(void *db_conn,
	slurmdb_job_cond_t *job_cond, List grouping_list)
{
	const bool flat_view = false;
	const bool wckey_type = true;
	const bool both = false;
	const bool acct_as_parent = false;

	return _process_grouped_report(db_conn, job_cond, grouping_list,
				       flat_view, wckey_type, both,
				       acct_as_parent);
}
/*
 * Report job sizes grouped by account and then by wckey.
 *
 * Forwards to _process_grouped_report() with wckey_type cleared and the
 * "both" flag set; every other argument is passed through unchanged.
 *
 * RET whatever _process_grouped_report() returns
 */
extern List slurmdb_report_job_sizes_grouped_by_account_then_wckey(
	void *db_conn, slurmdb_job_cond_t *job_cond,
	List grouping_list, bool flat_view, bool acct_as_parent)
{
	const bool wckey_type = false;
	const bool both = true;

	return _process_grouped_report(db_conn, job_cond, grouping_list,
				       flat_view, wckey_type, both,
				       acct_as_parent);
}