📄 mom_mach.c
字号:
/** OpenPBS (Portable Batch System) v2.3 Software License* * Copyright (c) 1999-2000 Veridian Information Solutions, Inc.* All rights reserved.* * ---------------------------------------------------------------------------* For a license to use or redistribute the OpenPBS software under conditions* other than those described below, or to purchase support for this software,* please contact Veridian Systems, PBS Products Department ("Licensor") at:* * www.OpenPBS.org +1 650 967-4675 sales@OpenPBS.org* 877 902-4PBS (US toll-free)* ---------------------------------------------------------------------------* * This license covers use of the OpenPBS v2.3 software (the "Software") at* your site or location, and, for certain users, redistribution of the* Software to other sites and locations. Use and redistribution of* OpenPBS v2.3 in source and binary forms, with or without modification,* are permitted provided that all of the following conditions are met.* After December 31, 2001, only conditions 3-6 must be met:* * 1. Commercial and/or non-commercial use of the Software is permitted* provided a current software registration is on file at www.OpenPBS.org.* If use of this software contributes to a publication, product, or* service, proper attribution must be given; see www.OpenPBS.org/credit.html* * 2. Redistribution in any form is only permitted for non-commercial,* non-profit purposes. There can be no charge for the Software or any* software incorporating the Software. Further, there can be no* expectation of revenue generated as a consequence of redistributing* the Software.* * 3. Any Redistribution of source code must retain the above copyright notice* and the acknowledgment contained in paragraph 6, this list of conditions* and the disclaimer contained in paragraph 7.* * 4. Any Redistribution in binary form must reproduce the above copyright* notice and the acknowledgment contained in paragraph 6, this list of* conditions and the disclaimer contained in paragraph 7 in the* documentation and/or other materials provided with the distribution.* * 5. Redistributions in any form must be accompanied by information on how to* obtain complete source code for the OpenPBS software and any* modifications and/or additions to the OpenPBS software. The source code* must either be included in the distribution or be available for no more* than the cost of distribution plus a nominal fee, and all modifications* and additions to the Software must be freely redistributable by any party* (including Licensor) without restriction.* * 6. All advertising materials mentioning features or use of the Software must* display the following acknowledgment:* * "This product includes software developed by NASA Ames Research Center,* Lawrence Livermore National Laboratory, and Veridian Information * Solutions, Inc.* Visit www.OpenPBS.org for OpenPBS software support,* products, and information."* * 7. DISCLAIMER OF WARRANTY* * THIS SOFTWARE IS PROVIDED "AS IS" WITHOUT WARRANTY OF ANY KIND. ANY EXPRESS* OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES* OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, AND NON-INFRINGEMENT* ARE EXPRESSLY DISCLAIMED.* * IN NO EVENT SHALL VERIDIAN CORPORATION, ITS AFFILIATED COMPANIES, OR THE* U.S. GOVERNMENT OR ANY OF ITS AGENCIES BE LIABLE FOR ANY DIRECT OR INDIRECT,* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,* OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,* EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.* * This license will be governed by the laws of the Commonwealth of Virginia,* without reference to its choice of law rules.*//*** System dependent code to gather information for a Sun machine.**** Resources known by this code:** cput cpu time for a pid or session** mem memory size for a pid or session in KB** resi resident memory size for a pid or session in KB** sessions list of sessions in the system** pids list of pids in a session** nsessions number of sessions in the system** nusers number of users in the system** totmem total memory size in KB** availmem available memory size in KB** physmem physical memory size in KB** size size of a file or filesystem in KB** idletime seconds of idle time** walltime wall clock time for a pid** loadave current load average** quota quota information (sizes in KB)*/#include <pbs_config.h> /* the master config generated by configure */#include <assert.h>#include <limits.h>#include <stdio.h>#include <stdlib.h>#include <ctype.h>#include <dirent.h>#include <string.h>#include <fcntl.h>#include <errno.h>#include <pwd.h>#include <mntent.h>#include <sys/types.h>#include <sys/time.h>#include <sys/param.h>#include <sys/file.h>#include <sys/stat.h>#include <sys/vfs.h>#include <sys/user.h>#include <sys/uio.h>#include <sys/proc.h>#include <sys/session.h>#include <sys/vnode.h>#include <ufs/inode.h>#include <sys/stream.h>#include <sys/stropts.h>#include <nlist.h>#include <vm/anon.h>#include <ufs/quota.h>#include <kvm.h>#include "portability.h"#include "pbs_error.h"#include "log.h"#include "list_link.h"#include "server_limits.h"#include "attribute.h"#include "resource.h"#include "job.h"#include "mom_mach.h"#include "resmon.h"#include "../rm_dep.h"static char ident[] = "@(#) sun/$RCSfile: mom_mach.c,v $ $Revision: 2.7.4.4 $";#ifndef TRUE#define FALSE 0#define TRUE 1#endif /* TRUE *//*** external functions and data*/extern struct config *search A_((struct config *, char *));extern struct rm_attribute *momgetattr A_((char *));extern int rm_errno;extern unsigned int reqnum;extern double cputfactor;extern double wallfactor;/*** local functions*/static char *resi A_((struct rm_attribute *attrib));static char *totmem A_((struct rm_attribute *attrib));static char *availmem A_((struct rm_attribute *attrib));static char *physmem A_((struct rm_attribute *attrib));static char *walltime A_((struct rm_attribute *attrib));static char *quota A_((struct rm_attribute *attrib));extern char *loadave A_((struct rm_attribute *attrib));extern char *nullproc A_((struct rm_attribute *attrib));struct config dependent_config[] = { { "resi", resi }, { "totmem", totmem }, { "availmem", availmem }, { "physmem", physmem }, { "loadave", loadave }, { "walltime", walltime }, { "quota", quota }, { NULL, nullproc }};struct nlist nl[] = { { "_proc" }, /* 0 */ { "_nproc" }, /* 1 */ { "_anoninfo" }, /* 2 */ { "_physmem" }, /* 3 */ { "_avenrun" }, /* 4 */ { "" }};#define KSYM_PROC 0#define KSYM_NPROC 1#define KSYM_ANON 2#define KSYM_PHYS 3#define KSYM_LOAD 4time_t wait_time = 10;kvm_t *kd = NULL;struct proc *proc_tbl = NULL;pid_t *sess_tbl = NULL;int nproc = 0;extern char *ret_string;extern char extra_parm[];extern char no_parm[];char nokernel[] = "kernel not available";char noproc[] = "process %d does not exist";voiddep_initialize(){ char *id = "dep_initialize"; if (kd == NULL) { if ((kd = kvm_open(NULL, NULL, NULL, O_RDONLY, "rm")) == NULL) { log_err(errno, id, "kvm_open"); return; } } if (kvm_nlist(kd, nl) == -1) { log_err(errno, id, "kvm_nlist"); return; } return;}voiddep_cleanup(){ char *id = "dep_cleanup"; log_record(PBSEVENT_SYSTEM, 0, id, "dependent cleanup"); if (kd) kvm_close(kd); kd = NULL;}voidend_proc(){ return;}extern struct pbs_err_to_txt pbs_err_to_txt[];extern time_t time_now;/* * Time decoding macro. Accepts a timeval structure. Returns unsigned long * time in seconds. (tv_usec is in microseconds) */#define tv(val) ((val).tv_sec + ((unsigned long)(val).tv_usec + 500000)/1000000)/* * Internal size decoding routine. * * Accepts a resource pointer and a pointer to the unsigned long integer * to receive the decoded value. It returns a PBS error code, and the * decoded value in the unsigned long integer. * * For SunOS, * * sizeof(word) = sizeof(int) */static int getsize(pres, ret) resource *pres; unsigned long *ret;{ unsigned long value; if (pres->rs_value.at_type != ATR_TYPE_SIZE) return (PBSE_ATTRTYPE); value = pres->rs_value.at_val.at_size.atsv_num; if (pres->rs_value.at_val.at_size.atsv_units == ATR_SV_WORDSZ) { if (value > ULONG_MAX / sizeof(int)) return (PBSE_BADATVAL); value *= sizeof(int); } if (value > ULONG_MAX >> pres->rs_value.at_val.at_size.atsv_shift) return (PBSE_BADATVAL); *ret = value << pres->rs_value.at_val.at_size.atsv_shift; return (PBSE_NONE);}/* * Internal time decoding routine. * * Accepts a resource pointer and a pointer to the unsigned long integer * to receive the decoded value. It returns a PBS error code, and the * decoded value of time in seconds in the unsigned long integer. */static int gettime(pres, ret) resource *pres; unsigned long *ret;{ if (pres->rs_value.at_type != ATR_TYPE_LONG) return (PBSE_ATTRTYPE); if (pres->rs_value.at_val.at_long < 0) return (PBSE_BADATVAL); *ret = pres->rs_value.at_val.at_long; return (PBSE_NONE);}/*** Scan a list of tasks and return true if one of them matches** the process (sid or pid) represented by *psp.*/staticintinjob(pjob, sesid) job *pjob; pid_t sesid;{ task *ptask; for (ptask = (task *)GET_NEXT(pjob->ji_tasks); ptask; ptask = (task *)GET_NEXT(ptask->ti_jobtask)) { if (ptask->ti_qs.ti_sid <= 1) continue; if (ptask->ti_qs.ti_sid == sesid) return TRUE; } return FALSE;}#define MINPROC 10#define MAXPROC 10000/* * Internal session cpu time decoding routine. * * Accepts a session id. Returns the sum of all cpu time consumed for all * tasks executed by the job, in seconds, adjusted by cputfactor. */static unsigned long cput_sum(pjob) job *pjob;{ char *id = "cput_sum"; int i; register struct user *uarea; unsigned long cputime; int nps = 0; cputime = 0; for (i=0; i<nproc; i++) { register struct proc *pp = &proc_tbl[i]; if (pp->p_stat==0) continue; if (!injob(pjob, sess_tbl[i])) continue; nps++; if (pp->p_ru == NULL) { if ((uarea = kvm_getu(kd, pp)) == NULL) continue; else { cputime += tv(uarea->u_ru.ru_utime) + tv(uarea->u_ru.ru_stime) + tv(uarea->u_cru.ru_utime) + tv(uarea->u_cru.ru_stime); } } else { struct rusage ru; if (kvm_read(kd, (unsigned long)pp->p_ru, (char *)&ru, sizeof(ru)) != sizeof(ru)) { log_err(errno, id, "kvm_read(session)"); continue; } cputime += tv(ru.ru_utime) + tv(ru.ru_stime); } DBPRT(("%s: ses %d pid %d cputime %d\n", id, sess_tbl[i], pp->p_pid, cputime)) } if (nps == 0) pjob->ji_flags |= MOM_NO_PROC; return ((unsigned long)((double)cputime * cputfactor));}/* * Internal session memory usage function. * * Accepts a job ID. Returns the total number of bytes of address * space consumed by all current tasks within the job. */static unsigned long mem_sum(pjob) job *pjob;{ char *id="mem_sum"; int i; unsigned long memsize; memsize = 0; for (i=0; i<nproc; i++) { register struct proc *pp = &proc_tbl[i]; if (pp->p_stat==0) continue; if (!injob(pjob, sess_tbl[i])) continue; memsize += ctob(pp->p_tsize + pp->p_dsize + pp->p_ssize); DBPRT(("%s: ses %d pid=%d uid=%d totmem=%lu\n", id, sess_tbl[i], pp->p_pid, pp->p_uid, memsize)) } return (memsize);}/* * Internal session workingset size function. */static unsigned long resi_sum(pjob) job *pjob;{ char *id="resi_sum"; int i; unsigned long memsize; memsize = 0; for (i=0; i<nproc; i++) { register struct proc *pp = &proc_tbl[i]; if (pp->p_stat==0) continue; if (!injob(pjob, sess_tbl[i])) continue; memsize += ctob(pp->p_rssize); DBPRT(("%s: pid=%d ses=%d uid=%d mem=%d totmem=%d\n", id, pp->p_pid, sess_tbl[i], pp->p_uid, pp->p_rssize, memsize)) } return (memsize);}/* * Return TRUE if any task in the job is over limit for memory usage. */static int overmem_proc(pjob, limit) job *pjob; unsigned long limit;{ int i; for (i=0; i<nproc; i++) { register struct proc *pp = &proc_tbl[i]; if (pp->p_stat==0) continue; if (!injob(pjob, sess_tbl[i])) continue; if (ctob(pp->p_tsize + pp->p_dsize + pp->p_ssize) > limit) return (TRUE); } return (FALSE);}extern char *msg_momsetlim;/* * Internal error routine */int error(string, value) char *string; int value;{ int i = 0; char *message; assert(string != NULL); assert(*string != '\0'); assert(value > PBSE_); /* minimum PBS error number */ assert(value <= PBSE_NOSYNCMSTR); /* maximum PBS error number */ assert(pbs_err_to_txt[i].err_no != 0); do { if (pbs_err_to_txt[i].err_no == value) break; } while (pbs_err_to_txt[++i].err_no != 0); assert(pbs_err_to_txt[i].err_txt != NULL); message = *pbs_err_to_txt[i].err_txt; assert(message != NULL); assert(*message != '\0'); (void)fprintf(stderr, msg_momsetlim, string, message); (void)fflush(stderr); return (value);}/* * Establish system-enforced limits for the job. * * Run through the resource list, checking the values for all items * we recognize. * * If set_mode is SET_LIMIT_SET, then also set hard limits for the * system enforced limits (not-polled). * If anything goes wrong with the process, return a PBS error code * and print a message on standard error. A zero-length resource list * is not an error. * * If set_mode is SET_LIMIT_SET the entry conditions are: * 1. MOM has already forked, and we are called from the child.
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -