pinger.c

来自「lustre 1.6.5 source code」· C语言 代码 · 共 703 行 · 第 1/2 页

C
703
字号
/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*- * vim:expandtab:shiftwidth=8:tabstop=8: * * Portal-RPC reconnection and replay operations, for use in recovery. * *  Copyright (c) 2003 Cluster File Systems, Inc. *   Authors: Phil Schwan <phil@clusterfs.com> *            Mike Shaver <shaver@clusterfs.com> * *   This file is part of the Lustre file system, http://www.lustre.org *   Lustre is a trademark of Cluster File Systems, Inc. * *   You may have signed or agreed to another license before downloading *   this software.  If so, you are bound by the terms and conditions *   of that agreement, and the following does not apply to you.  See the *   LICENSE file included with this distribution for more information. * *   If you did not agree to a different license, then this copy of Lustre *   is open source software; you can redistribute it and/or modify it *   under the terms of version 2 of the GNU General Public License as *   published by the Free Software Foundation. * *   In either case, Lustre is distributed in the hope that it will be *   useful, but WITHOUT ANY WARRANTY; without even the implied warranty *   of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the *   license text for more details. */#ifndef __KERNEL__#include <liblustre.h>#else#define DEBUG_SUBSYSTEM S_RPC#endif#include <obd_support.h>#include <obd_class.h>#include "ptlrpc_internal.h"struct semaphore pinger_sem;static struct list_head pinger_imports = CFS_LIST_HEAD_INIT(pinger_imports);int ptlrpc_ping(struct obd_import *imp){        struct ptlrpc_request *req;        int rc = 0;        ENTRY;        req = ptlrpc_prep_req(imp, LUSTRE_OBD_VERSION, OBD_PING,                               1, NULL, NULL);        if (req) {                DEBUG_REQ(D_INFO, req, "pinging %s->%s",                          imp->imp_obd->obd_uuid.uuid,                          obd2cli_tgt(imp->imp_obd));                req->rq_no_resend = req->rq_no_delay = 1;                ptlrpc_req_set_repsize(req, 1, NULL);                ptlrpcd_add_req(req);        } else {                CERROR("OOM trying to ping %s->%s\n",                       imp->imp_obd->obd_uuid.uuid,                       obd2cli_tgt(imp->imp_obd));                rc = -ENOMEM;        }        RETURN(rc);}void ptlrpc_update_next_ping(struct obd_import *imp){#ifdef ENABLE_PINGER        int time = PING_INTERVAL;        if (imp->imp_state == LUSTRE_IMP_DISCON) {                int dtime = max_t(int, CONNECTION_SWITCH_MIN,                                  AT_OFF ? 0 :                                  at_get(&imp->imp_at.iat_net_latency));                time = min(time, dtime);        }        imp->imp_next_ping = cfs_time_shift(time);#endif /* ENABLE_PINGER */}void ptlrpc_ping_import_soon(struct obd_import *imp){        imp->imp_next_ping = cfs_time_current();}#ifdef __KERNEL__static int ptlrpc_pinger_main(void *arg){        struct ptlrpc_svc_data *data = (struct ptlrpc_svc_data *)arg;        struct ptlrpc_thread *thread = data->thread;        ENTRY;        cfs_daemonize(data->name);        /* Record that the thread is running */        thread->t_flags = SVC_RUNNING;        cfs_waitq_signal(&thread->t_ctl_waitq);        /* And now, loop forever, pinging as needed. */        while (1) {                cfs_time_t this_ping = cfs_time_current();                struct l_wait_info lwi;                cfs_duration_t time_to_next_ping;                struct list_head *iter;                mutex_down(&pinger_sem);                list_for_each(iter, &pinger_imports) {                        struct obd_import *imp =                                list_entry(iter, struct obd_import,                                           imp_pinger_chain);                        int force, level;                        spin_lock(&imp->imp_lock);                        level = imp->imp_state;                        force = imp->imp_force_verify;                        imp->imp_force_verify = 0;                        spin_unlock(&imp->imp_lock);                        CDEBUG(level == LUSTRE_IMP_FULL ? D_INFO : D_RPCTRACE,                               "level %s/%u force %u deactive %u pingable %u\n",                               ptlrpc_import_state_name(level), level,                               force, imp->imp_deactive, imp->imp_pingable);                        if (force ||                            /* if the next ping is within, say, 5 jiffies from                               now, go ahead and ping. See note below. */                            cfs_time_aftereq(this_ping,                                              imp->imp_next_ping - 5 * CFS_TICK)) {                                if (level == LUSTRE_IMP_DISCON &&                                    !imp->imp_deactive) {                                        /* wait at least a timeout before                                           trying recovery again. */                                        imp->imp_next_ping = cfs_time_shift(obd_timeout);                                        ptlrpc_initiate_recovery(imp);                                } else if (level != LUSTRE_IMP_FULL ||                                         imp->imp_obd->obd_no_recov ||                                         imp->imp_deactive) {                                        CDEBUG(D_HA, "not pinging %s "                                               "(in recovery: %s or recovery "                                               "disabled: %u/%u)\n",                                               obd2cli_tgt(imp->imp_obd),                                               ptlrpc_import_state_name(level),                                               imp->imp_deactive,                                               imp->imp_obd->obd_no_recov);                                } else if (imp->imp_pingable || force) {                                        ptlrpc_ping(imp);                                }                        } else {                                if (!imp->imp_pingable)                                        continue;                                CDEBUG(D_INFO,                                       "don't need to ping %s ("CFS_TIME_T                                       " > "CFS_TIME_T")\n",                                       obd2cli_tgt(imp->imp_obd),                                       imp->imp_next_ping, this_ping);                        }                        /* obd_timeout might have changed */                        if (cfs_time_after(imp->imp_next_ping,                                           cfs_time_add(this_ping,                                                         cfs_time_seconds(PING_INTERVAL))))                                ptlrpc_update_next_ping(imp);                }                mutex_up(&pinger_sem);                /* update memory usage info */                obd_update_maxusage();                /* Wait until the next ping time, or until we're stopped. */                time_to_next_ping = cfs_time_sub(cfs_time_add(this_ping,                                                               cfs_time_seconds(PING_INTERVAL)),                                                  cfs_time_current());                /* The ping sent by ptlrpc_send_rpc may get sent out                   say .01 second after this.                   ptlrpc_pinger_eending_on_import will then set the                   next ping time to next_ping + .01 sec, which means                   we will SKIP the next ping at next_ping, and the                   ping will get sent 2 timeouts from now!  Beware. */                CDEBUG(D_INFO, "next ping in "CFS_DURATION_T" ("CFS_TIME_T")\n",                                time_to_next_ping,                                cfs_time_add(this_ping, cfs_time_seconds(PING_INTERVAL)));                if (time_to_next_ping > 0) {                        lwi = LWI_TIMEOUT(max_t(cfs_duration_t, time_to_next_ping, cfs_time_seconds(1)),                                          NULL, NULL);                        l_wait_event(thread->t_ctl_waitq,                                     thread->t_flags & (SVC_STOPPING|SVC_EVENT),                                     &lwi);                        if (thread->t_flags & SVC_STOPPING) {                                thread->t_flags &= ~SVC_STOPPING;                                EXIT;                                break;                        } else if (thread->t_flags & SVC_EVENT) {                                /* woken after adding import to reset timer */                                thread->t_flags &= ~SVC_EVENT;                        }                }        }        thread->t_flags = SVC_STOPPED;        cfs_waitq_signal(&thread->t_ctl_waitq);        CDEBUG(D_NET, "pinger thread exiting, process %d\n", cfs_curproc_pid());        return 0;}static struct ptlrpc_thread *pinger_thread = NULL;int ptlrpc_start_pinger(void){        struct l_wait_info lwi = { 0 };        struct ptlrpc_svc_data d;        int rc;#ifndef ENABLE_PINGER        return 0;#endif        ENTRY;        if (pinger_thread != NULL)                RETURN(-EALREADY);        OBD_ALLOC(pinger_thread, sizeof(*pinger_thread));        if (pinger_thread == NULL)                RETURN(-ENOMEM);        cfs_waitq_init(&pinger_thread->t_ctl_waitq);        d.name = "ll_ping";        d.thread = pinger_thread;        /* CLONE_VM and CLONE_FILES just avoid a needless copy, because we         * just drop the VM and FILES in ptlrpc_daemonize() right away. */        rc = cfs_kernel_thread(ptlrpc_pinger_main, &d, CLONE_VM | CLONE_FILES);        if (rc < 0) {                CERROR("cannot start thread: %d\n", rc);                OBD_FREE(pinger_thread, sizeof(*pinger_thread));                pinger_thread = NULL;                RETURN(rc);        }        l_wait_event(pinger_thread->t_ctl_waitq,                     pinger_thread->t_flags & SVC_RUNNING, &lwi);        RETURN(0);}int ptlrpc_stop_pinger(void){        struct l_wait_info lwi = { 0 };        int rc = 0;#ifndef ENABLE_PINGER        return 0;#endif        ENTRY;        if (pinger_thread == NULL)                RETURN(-EALREADY);        mutex_down(&pinger_sem);        pinger_thread->t_flags = SVC_STOPPING;        cfs_waitq_signal(&pinger_thread->t_ctl_waitq);        mutex_up(&pinger_sem);        l_wait_event(pinger_thread->t_ctl_waitq,                     (pinger_thread->t_flags & SVC_STOPPED), &lwi);        OBD_FREE(pinger_thread, sizeof(*pinger_thread));        pinger_thread = NULL;        RETURN(rc);}void ptlrpc_pinger_sending_on_import(struct obd_import *imp){        ptlrpc_update_next_ping(imp);}int ptlrpc_pinger_add_import(struct obd_import *imp){        ENTRY;        if (!list_empty(&imp->imp_pinger_chain))                RETURN(-EALREADY);        mutex_down(&pinger_sem);        CDEBUG(D_HA, "adding pingable import %s->%s\n",               imp->imp_obd->obd_uuid.uuid, obd2cli_tgt(imp->imp_obd));        /* if we add to pinger we want recovery on this import */        imp->imp_obd->obd_no_recov = 0;        ptlrpc_update_next_ping(imp);        /* XXX sort, blah blah */        list_add_tail(&imp->imp_pinger_chain, &pinger_imports);        class_import_get(imp);        ptlrpc_pinger_wake_up();        mutex_up(&pinger_sem);        RETURN(0);}int ptlrpc_pinger_del_import(struct obd_import *imp){        ENTRY;        if (list_empty(&imp->imp_pinger_chain))                RETURN(-ENOENT);        mutex_down(&pinger_sem);        list_del_init(&imp->imp_pinger_chain);        CDEBUG(D_HA, "removing pingable import %s->%s\n",               imp->imp_obd->obd_uuid.uuid, obd2cli_tgt(imp->imp_obd));        /* if we remove from pinger we don't want recovery on this import */        imp->imp_obd->obd_no_recov = 1;        class_import_put(imp);        mutex_up(&pinger_sem);        RETURN(0);}void ptlrpc_pinger_wake_up(){#ifdef ENABLE_PINGER        pinger_thread->t_flags |= SVC_EVENT;        cfs_waitq_signal(&pinger_thread->t_ctl_waitq);#endif}/* Ping evictor thread */#define PET_READY     1#define PET_TERMINATE 2static int               pet_refcount = 0;static int               pet_state;static wait_queue_head_t pet_waitq;static struct obd_export *pet_exp = NULL;static spinlock_t        pet_lock = SPIN_LOCK_UNLOCKED;int ping_evictor_wake(struct obd_export *exp){        spin_lock(&pet_lock);        if (pet_exp || (pet_state != PET_READY)) {                /* eventually the new obd will call here again. */                spin_unlock(&pet_lock);                return 1;        }        /* We have to make sure the obd isn't destroyed between now and when         * the ping evictor runs.  We'll take a reference here, and drop it         * when we finish in the evictor.  We don't really care about this         * export in particular; we just need one to keep the obd alive. */        pet_exp = class_export_get(exp);        spin_unlock(&pet_lock);        wake_up(&pet_waitq);        return 0;}static int ping_evictor_main(void *arg){

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?