/*****************************************************************************\ * event_functions.c - functions dealing with events in the * accounting system. ***************************************************************************** * Copyright (C) 2008 Lawrence Livermore National Security. * Copyright (C) 2002-2007 The Regents of the University of California. * Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER). * Written by Danny Auble * CODE-OCEC-09-009. All rights reserved. * * This file is part of Slurm, a resource management program. * For details, see . * Please also read the included file: DISCLAIMER. * * Slurm is free software; you can redistribute it and/or modify it under * the terms of the GNU General Public License as published by the Free * Software Foundation; either version 2 of the License, or (at your option) * any later version. * * In addition, as a special exception, the copyright holders give permission * to link the code of portions of this program with the OpenSSL library under * certain conditions as described in each individual source file, and * distribute linked combinations including the two. You must obey the GNU * General Public License in all respects for all of the code used other than * OpenSSL. If you modify file(s) with this exception, you may extend this * exception to your version of the file(s), but you are not obligated to do * so. If you do not wish to do so, delete this exception statement from your * version. If you delete this exception statement from all source files in * the program, then also delete it here. * * Slurm is distributed in the hope that it will be useful, but WITHOUT ANY * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more * details. * * You should have received a copy of the GNU General Public License along * with Slurm; if not, write to the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. \*****************************************************************************/ #include #include "src/common/slurm_time.h" #include "src/common/slurmdbd_defs.h" #include "src/common/uid.h" #include "src/sacctmgr/sacctmgr.h" static uint32_t _decode_node_state(char *val) { int vallen; xassert(val); vallen = strlen(val); if (!xstrncasecmp(val, "DRAIN", MAX(vallen, 3))) return NODE_STATE_DRAIN; else if (!xstrncasecmp(val, "FAIL", MAX(vallen, 3))) return NODE_STATE_FAIL; else if (!xstrncasecmp(val, "REBOOT", MAX(vallen, 3))) return NODE_STATE_REBOOT; else { uint32_t j; for (j = 0; j < NODE_STATE_END; j++) { if (xstrncasecmp(node_state_string(j), val, MAX(vallen, 3)) == 0){ return j; } } if (j == NODE_STATE_END) { exit_code = 1; fprintf(stderr, "Invalid state: %s\n", val); fprintf (stderr, "Valid node states are: "); fprintf (stderr, "DRAIN FAIL "); for (j = 0; j < NODE_STATE_END; j++) { fprintf (stderr, "%s ", node_state_string(j)); } fprintf (stderr, "\n"); } } return NO_VAL; } static int _addto_state_char_list(List char_list, char *names) { int i=0, start=0; uint32_t c; char *name = NULL, *tmp_char = NULL; ListIterator itr = NULL; char quote_c = '\0'; int quote = 0; int count = 0; if (!char_list) { error("No list was given to fill in"); return 0; } itr = list_iterator_create(char_list); if (names) { if (names[i] == '\"' || names[i] == '\'') { quote_c = names[i]; quote = 1; i++; } start = i; while(names[i]) { //info("got %d - %d = %d", i, start, i-start); if (quote && names[i] == quote_c) break; else if (names[i] == '\"' || names[i] == '\'') names[i] = '`'; else if (names[i] == ',') { if ((i-start) > 0) { name = xmalloc((i-start+1)); memcpy(name, names+start, (i-start)); c = _decode_node_state(name); if (c == NO_VAL) fatal("unrecognized job " "state value"); xfree(name); name = xstrdup_printf("%u", c); while((tmp_char = list_next(itr))) { if (!xstrcasecmp(tmp_char, name)) break; } if (!tmp_char) { list_append(char_list, name); count++; } else xfree(name); list_iterator_reset(itr); } i++; start = i; if (!names[i]) { info("There is a problem with " "your request. It appears you " "have spaces inside your list."); break; } } i++; } if ((i-start) > 0) { name = xmalloc((i-start)+1); memcpy(name, names+start, (i-start)); c = _decode_node_state(name); if (c == NO_VAL) fatal("unrecognized job state value"); xfree(name); name = xstrdup_printf("%u", c); while((tmp_char = list_next(itr))) { if (!xstrcasecmp(tmp_char, name)) break; } if (!tmp_char) { list_append(char_list, name); count++; } else xfree(name); } } list_iterator_destroy(itr); return count; } static char *_convert_to_id(char *name, bool gid) { if (gid) { gid_t gid; if ( gid_from_string( name, &gid ) != 0 ) { fprintf(stderr, "Invalid group id: %s\n", name); exit(1); } xfree(name); name = xstrdup_printf( "%d", (int) gid ); } else { uid_t uid; if ( uid_from_string( name, &uid ) != 0 ) { fprintf(stderr, "Invalid user id: %s\n", name); exit(1); } xfree(name); name = xstrdup_printf( "%d", (int) uid ); } return name; } /* returns number of objects added to list */ static int _addto_id_char_list(List char_list, char *names, bool gid) { int i=0, start=0; char *name = NULL, *tmp_char = NULL; ListIterator itr = NULL; char quote_c = '\0'; int quote = 0; int count = 0; if (!char_list) { error("No list was given to fill in"); return 0; } itr = list_iterator_create(char_list); if (names) { if (names[i] == '\"' || names[i] == '\'') { quote_c = names[i]; quote = 1; i++; } start = i; while(names[i]) { //info("got %d - %d = %d", i, start, i-start); if (quote && names[i] == quote_c) break; else if (names[i] == '\"' || names[i] == '\'') names[i] = '`'; else if (names[i] == ',') { if ((i-start) > 0) { name = xmalloc((i-start+1)); memcpy(name, names+start, (i-start)); //info("got %s %d", name, i-start); name = _convert_to_id( name, gid ); while((tmp_char = list_next(itr))) { if (!xstrcasecmp(tmp_char, name)) break; } if (!tmp_char) { list_append(char_list, name); count++; } else xfree(name); list_iterator_reset(itr); } i++; start = i; if (!names[i]) { info("There is a problem with " "your request. It appears you " "have spaces inside your list."); break; } } i++; } if ((i-start) > 0) { name = xmalloc((i-start)+1); memcpy(name, names+start, (i-start)); name = _convert_to_id(name, gid); while((tmp_char = list_next(itr))) { if (!xstrcasecmp(tmp_char, name)) break; } if (!tmp_char) { list_append(char_list, name); count++; } else xfree(name); } } list_iterator_destroy(itr); return count; } static int _set_cond(int *start, int argc, char **argv, slurmdb_event_cond_t *event_cond, List format_list) { int i, end = 0; int set = 0; int command_len = 0; int local_cluster_flag = 0; int all_time_flag = 0; if (!event_cond->cluster_list) event_cond->cluster_list = list_create(xfree_ptr); for (i=(*start); icluster_list) event_cond->cluster_list = list_create(xfree_ptr); if (slurm_addto_char_list(event_cond->cluster_list, argv[i]+end)) set = 1; } else if (!xstrncasecmp(argv[i], "End", MAX(command_len, 1))) { event_cond->period_end = parse_time(argv[i]+end, 1); set = 1; } else if (!xstrncasecmp(argv[i], "Format", MAX(command_len, 1))) { if (format_list) slurm_addto_char_list(format_list, argv[i]+end); } else if (!xstrncasecmp(argv[i], "MinCpus", MAX(command_len, 2))) { if (get_uint(argv[i]+end, &event_cond->cpus_min, "MinCpus") == SLURM_SUCCESS) set = 1; } else if (!xstrncasecmp(argv[i], "MaxCpus", MAX(command_len, 2))) { if (get_uint(argv[i]+end, &event_cond->cpus_max, "MaxCpus") == SLURM_SUCCESS) set = 1; } else if (!xstrncasecmp(argv[i], "Nodes", MAX(command_len, 1))) { xfree(event_cond->node_list); event_cond->node_list = xstrdup(argv[i]+end); set = 1; } else if (!xstrncasecmp(argv[i], "Reason", MAX(command_len, 1))) { if (!event_cond->reason_list) event_cond->reason_list = list_create(xfree_ptr); if (slurm_addto_char_list(event_cond->reason_list, argv[i]+end)) set = 1; } else if (!xstrncasecmp(argv[i], "Start", MAX(command_len, 4))) { event_cond->period_start = parse_time(argv[i]+end, 1); set = 1; } else if (!xstrncasecmp(argv[i], "States", MAX(command_len, 4))) { if (!event_cond->state_list) event_cond->state_list = list_create(xfree_ptr); if (_addto_state_char_list(event_cond->state_list, argv[i]+end)) { event_cond->event_type = SLURMDB_EVENT_NODE; set = 1; } } else if (!xstrncasecmp(argv[i], "User", MAX(command_len, 1))) { if (!event_cond->reason_uid_list) event_cond->reason_uid_list = list_create(xfree_ptr); if (_addto_id_char_list(event_cond->reason_uid_list, argv[i]+end, 0)) { event_cond->event_type = SLURMDB_EVENT_NODE; set = 1; } } else { exit_code=1; fprintf(stderr, " Unknown condition: %s\n", argv[i]); } } (*start) = i; if (!local_cluster_flag && !list_count(event_cond->cluster_list)) { char *temp = slurm_get_cluster_name(); if (temp) list_append(event_cond->cluster_list, temp); } if (!all_time_flag && !event_cond->period_start) { event_cond->period_start = time(NULL); if (!event_cond->state_list) { struct tm start_tm; if (!localtime_r(&event_cond->period_start, &start_tm)) { fprintf(stderr, " Couldn't get localtime from %ld", (long)event_cond->period_start); exit_code=1; return 0; } start_tm.tm_sec = 0; start_tm.tm_min = 0; start_tm.tm_hour = 0; start_tm.tm_mday--; event_cond->period_start = slurm_mktime(&start_tm); } } return set; } extern int sacctmgr_list_event(int argc, char **argv) { int rc = SLURM_SUCCESS; slurmdb_event_cond_t *event_cond = xmalloc(sizeof(slurmdb_event_cond_t)); List event_list = NULL; slurmdb_event_rec_t *event = NULL; int i = 0; ListIterator itr = NULL; ListIterator itr2 = NULL; int field_count = 0; print_field_t *field = NULL; List format_list = list_create(xfree_ptr); List print_fields_list; /* types are of print_field_t */ /* If we don't have any arguments make sure we set up the time correctly for just the past day. */ if (argc == 0) { struct tm start_tm; event_cond->period_start = time(NULL); if (!localtime_r(&event_cond->period_start, &start_tm)) { fprintf(stderr, " Couldn't get localtime from %ld", (long)event_cond->period_start); exit_code = 1; slurmdb_destroy_event_cond(event_cond); return 0; } start_tm.tm_sec = 0; start_tm.tm_min = 0; start_tm.tm_hour = 0; start_tm.tm_mday--; event_cond->period_start = slurm_mktime(&start_tm); } for (i = 0; i < argc; i++) { int command_len = strlen(argv[i]); if (!xstrncasecmp(argv[i], "Where", MAX(command_len, 5)) || !xstrncasecmp(argv[i], "Set", MAX(command_len, 3))) i++; _set_cond(&i, argc, argv, event_cond, format_list); } if (exit_code) { slurmdb_destroy_event_cond(event_cond); FREE_NULL_LIST(format_list); return SLURM_ERROR; } if (!list_count(format_list)) { if (event_cond->event_type == SLURMDB_EVENT_CLUSTER) slurm_addto_char_list(format_list, "Cluster,TRES,Start,End," "ClusterNodes"); else slurm_addto_char_list(format_list, "Cluster,NodeName,Start," "End,State,Reason,User"); } print_fields_list = sacctmgr_process_format_list(format_list); FREE_NULL_LIST(format_list); if (exit_code) { FREE_NULL_LIST(print_fields_list); return SLURM_ERROR; } event_list = slurmdb_events_get(db_conn, event_cond); slurmdb_destroy_event_cond(event_cond); if (!event_list) { exit_code=1; fprintf(stderr, " Error with request: %s\n", slurm_strerror(errno)); FREE_NULL_LIST(print_fields_list); return SLURM_ERROR; } itr = list_iterator_create(event_list); itr2 = list_iterator_create(print_fields_list); print_fields_header(print_fields_list); field_count = list_count(print_fields_list); while((event = list_next(itr))) { int curr_inx = 1; char tmp[20], *tmp_char; time_t newend = event->period_end; while((field = list_next(itr2))) { switch(field->type) { case PRINT_CLUSTER: field->print_routine(field, event->cluster, (curr_inx == field_count)); break; case PRINT_CLUSTER_NODES: field->print_routine( field, event->cluster_nodes, (curr_inx == field_count)); break; case PRINT_CPUS: convert_num_unit( (float)slurmdb_find_tres_count_in_string( event->tres_str, TRES_CPU), tmp, sizeof(tmp), UNIT_NONE, NO_VAL, CONVERT_NUM_UNIT_EXACT); field->print_routine( field, tmp, (curr_inx == field_count)); break; case PRINT_DURATION: if (!newend) newend = time(NULL); field->print_routine( field, (uint64_t)(newend - event->period_start), (curr_inx == field_count)); break; case PRINT_TIMEEND: field->print_routine(field, event->period_end, (curr_inx == field_count)); break; case PRINT_EVENTRAW: field->print_routine(field, event->event_type, (curr_inx == field_count)); break; case PRINT_EVENT: if (event->event_type == SLURMDB_EVENT_CLUSTER) tmp_char = "Cluster"; else if (event->event_type == SLURMDB_EVENT_NODE) tmp_char = "Node"; else tmp_char = "Unknown"; field->print_routine(field, tmp_char, (curr_inx == field_count)); break; case PRINT_NODENAME: field->print_routine(field, event->node_name, (curr_inx == field_count)); break; case PRINT_TIMESTART: field->print_routine(field, event->period_start, (curr_inx == field_count)); break; case PRINT_REASON: field->print_routine(field, event->reason, (curr_inx == field_count)); break; case PRINT_STATERAW: field->print_routine(field, event->state, (curr_inx == field_count)); break; case PRINT_STATE: if (event->event_type == SLURMDB_EVENT_CLUSTER) tmp_char = NULL; else tmp_char = node_state_string_compact( event->state); field->print_routine(field, tmp_char, (curr_inx == field_count)); break; case PRINT_TRES: sacctmgr_initialize_g_tres_list(); tmp_char = slurmdb_make_tres_string_from_simple( event->tres_str, g_tres_list, NO_VAL, CONVERT_NUM_UNIT_EXACT, 0, NULL); field->print_routine( field, tmp_char, (curr_inx == field_count)); xfree(tmp_char); break; case PRINT_USER: if (event->reason_uid != NO_VAL) { tmp_char = uid_to_string_cached( event->reason_uid); snprintf(tmp, sizeof(tmp), "%s(%u)", tmp_char, event->reason_uid); } else memset(tmp, 0, sizeof(tmp)); field->print_routine(field, tmp, (curr_inx == field_count)); break; default: field->print_routine(field, NULL, (curr_inx == field_count)); break; } curr_inx++; } list_iterator_reset(itr2); printf("\n"); } list_iterator_destroy(itr2); list_iterator_destroy(itr); FREE_NULL_LIST(event_list); FREE_NULL_LIST(print_fields_list); return rc; }