4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2011, 2012, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
30 * Lustre is a trademark of Sun Microsystems, Inc.
32 * lnet/selftest/conctl.c
34 * Console framework rpcs
36 * Author: Liang Zhen <liang@whamcloud.com>
39 #include <linux/libcfs/libcfs.h>
40 #include <linux/lnet/lib-lnet.h>
/* Forward declaration: called by lstcon_rpc_trans_stat() before its definition. */
void lstcon_rpc_stat_reply(struct lstcon_rpc_trans *trans,
			   struct srpc_msg *msg,
			   struct lstcon_node *nd,
			   struct lstcon_trans_stat *stat);
49 lstcon_rpc_done(struct srpc_client_rpc *rpc)
51 struct lstcon_rpc *crpc = (struct lstcon_rpc *)rpc->crpc_priv;
53 LASSERT(crpc && rpc == crpc->crp_rpc);
54 LASSERT(crpc->crp_posted && !crpc->crp_finished);
56 spin_lock(&rpc->crpc_lock);
58 if (!crpc->crp_trans) {
60 * Orphan RPC is not in any transaction,
61 * I'm just a poor body and nobody loves me
63 spin_unlock(&rpc->crpc_lock);
70 /* not an orphan RPC */
71 crpc->crp_finished = 1;
73 if (!crpc->crp_stamp) {
75 LASSERT(!crpc->crp_status);
77 crpc->crp_stamp = cfs_time_current();
78 crpc->crp_status = rpc->crpc_status;
81 /* wakeup (transaction)thread if I'm the last RPC in the transaction */
82 if (atomic_dec_and_test(&crpc->crp_trans->tas_remaining))
83 wake_up(&crpc->crp_trans->tas_waitq);
85 spin_unlock(&rpc->crpc_lock);
89 lstcon_rpc_init(struct lstcon_node *nd, int service, unsigned int feats,
90 int bulk_npg, int bulk_len, int embedded,
91 struct lstcon_rpc *crpc)
93 crpc->crp_rpc = sfw_create_rpc(nd->nd_id, service,
94 feats, bulk_npg, bulk_len,
95 lstcon_rpc_done, (void *)crpc);
99 crpc->crp_trans = NULL;
101 crpc->crp_posted = 0;
102 crpc->crp_finished = 0;
103 crpc->crp_unpacked = 0;
104 crpc->crp_status = 0;
106 crpc->crp_embedded = embedded;
107 INIT_LIST_HEAD(&crpc->crp_link);
109 atomic_inc(&console_session.ses_rpc_counter);
115 lstcon_rpc_prep(struct lstcon_node *nd, int service, unsigned int feats,
116 int bulk_npg, int bulk_len, struct lstcon_rpc **crpcpp)
118 struct lstcon_rpc *crpc = NULL;
121 spin_lock(&console_session.ses_rpc_lock);
123 crpc = list_first_entry_or_null(&console_session.ses_rpc_freelist,
124 struct lstcon_rpc, crp_link);
126 list_del_init(&crpc->crp_link);
128 spin_unlock(&console_session.ses_rpc_lock);
131 LIBCFS_ALLOC(crpc, sizeof(*crpc));
136 rc = lstcon_rpc_init(nd, service, feats, bulk_npg, bulk_len, 0, crpc);
142 LIBCFS_FREE(crpc, sizeof(*crpc));
148 lstcon_rpc_put(struct lstcon_rpc *crpc)
150 struct srpc_bulk *bulk = &crpc->crp_rpc->crpc_bulk;
153 LASSERT(list_empty(&crpc->crp_link));
155 for (i = 0; i < bulk->bk_niov; i++) {
156 if (!bulk->bk_iovs[i].bv_page)
159 __free_page(bulk->bk_iovs[i].bv_page);
162 srpc_client_rpc_decref(crpc->crp_rpc);
164 if (crpc->crp_embedded) {
165 /* embedded RPC, don't recycle it */
166 memset(crpc, 0, sizeof(*crpc));
167 crpc->crp_embedded = 1;
170 spin_lock(&console_session.ses_rpc_lock);
172 list_add(&crpc->crp_link,
173 &console_session.ses_rpc_freelist);
175 spin_unlock(&console_session.ses_rpc_lock);
178 /* RPC is not alive now */
179 atomic_dec(&console_session.ses_rpc_counter);
183 lstcon_rpc_post(struct lstcon_rpc *crpc)
185 struct lstcon_rpc_trans *trans = crpc->crp_trans;
189 atomic_inc(&trans->tas_remaining);
190 crpc->crp_posted = 1;
192 sfw_post_rpc(crpc->crp_rpc);
196 lstcon_rpc_trans_name(int transop)
198 if (transop == LST_TRANS_SESNEW)
201 if (transop == LST_TRANS_SESEND)
204 if (transop == LST_TRANS_SESQRY)
207 if (transop == LST_TRANS_SESPING)
210 if (transop == LST_TRANS_TSBCLIADD)
213 if (transop == LST_TRANS_TSBSRVADD)
216 if (transop == LST_TRANS_TSBRUN)
219 if (transop == LST_TRANS_TSBSTOP)
222 if (transop == LST_TRANS_TSBCLIQRY)
225 if (transop == LST_TRANS_TSBSRVQRY)
228 if (transop == LST_TRANS_STATQRY)
235 lstcon_rpc_trans_prep(struct list_head *translist, int transop,
236 struct lstcon_rpc_trans **transpp)
238 struct lstcon_rpc_trans *trans;
241 list_for_each_entry(trans, translist, tas_link) {
243 * Can't enqueue two private transaction on
246 if ((trans->tas_opc & transop) == LST_TRANS_PRIVATE)
251 /* create a trans group */
252 LIBCFS_ALLOC(trans, sizeof(*trans));
256 trans->tas_opc = transop;
259 INIT_LIST_HEAD(&trans->tas_olink);
261 list_add_tail(&trans->tas_olink, translist);
263 list_add_tail(&trans->tas_link, &console_session.ses_trans_list);
265 INIT_LIST_HEAD(&trans->tas_rpcs_list);
266 atomic_set(&trans->tas_remaining, 0);
267 init_waitqueue_head(&trans->tas_waitq);
269 spin_lock(&console_session.ses_rpc_lock);
270 trans->tas_features = console_session.ses_features;
271 spin_unlock(&console_session.ses_rpc_lock);
278 lstcon_rpc_trans_addreq(struct lstcon_rpc_trans *trans, struct lstcon_rpc *crpc)
280 list_add_tail(&crpc->crp_link, &trans->tas_rpcs_list);
281 crpc->crp_trans = trans;
285 lstcon_rpc_trans_abort(struct lstcon_rpc_trans *trans, int error)
287 struct srpc_client_rpc *rpc;
288 struct lstcon_rpc *crpc;
289 struct lstcon_node *nd;
291 list_for_each_entry(crpc, &trans->tas_rpcs_list, crp_link) {
294 spin_lock(&rpc->crpc_lock);
296 if (!crpc->crp_posted || /* not posted */
297 crpc->crp_stamp) { /* rpc done or aborted already */
298 if (!crpc->crp_stamp) {
299 crpc->crp_stamp = cfs_time_current();
300 crpc->crp_status = -EINTR;
302 spin_unlock(&rpc->crpc_lock);
306 crpc->crp_stamp = cfs_time_current();
307 crpc->crp_status = error;
309 spin_unlock(&rpc->crpc_lock);
313 if (error != -ETIMEDOUT)
317 if (cfs_time_after(nd->nd_stamp, crpc->crp_stamp))
320 nd->nd_stamp = crpc->crp_stamp;
321 nd->nd_state = LST_NODE_DOWN;
326 lstcon_rpc_trans_check(struct lstcon_rpc_trans *trans)
328 if (console_session.ses_shutdown &&
329 !list_empty(&trans->tas_olink)) /* Not an end session RPC */
332 return !atomic_read(&trans->tas_remaining) ? 1 : 0;
336 lstcon_rpc_trans_postwait(struct lstcon_rpc_trans *trans, int timeout)
338 struct lstcon_rpc *crpc;
341 if (list_empty(&trans->tas_rpcs_list))
344 if (timeout < LST_TRANS_MIN_TIMEOUT)
345 timeout = LST_TRANS_MIN_TIMEOUT;
347 CDEBUG(D_NET, "Transaction %s started\n",
348 lstcon_rpc_trans_name(trans->tas_opc));
350 /* post all requests */
351 list_for_each_entry(crpc, &trans->tas_rpcs_list, crp_link) {
352 LASSERT(!crpc->crp_posted);
354 lstcon_rpc_post(crpc);
357 mutex_unlock(&console_session.ses_mutex);
359 rc = wait_event_interruptible_timeout(trans->tas_waitq,
360 lstcon_rpc_trans_check(trans),
361 cfs_time_seconds(timeout));
362 rc = (rc > 0) ? 0 : ((rc < 0) ? -EINTR : -ETIMEDOUT);
364 mutex_lock(&console_session.ses_mutex);
366 if (console_session.ses_shutdown)
369 if (rc || atomic_read(&trans->tas_remaining)) {
370 /* treat short timeout as canceled */
371 if (rc == -ETIMEDOUT && timeout < LST_TRANS_MIN_TIMEOUT * 2)
374 lstcon_rpc_trans_abort(trans, rc);
377 CDEBUG(D_NET, "Transaction %s stopped: %d\n",
378 lstcon_rpc_trans_name(trans->tas_opc), rc);
380 lstcon_rpc_trans_stat(trans, lstcon_trans_stat());
386 lstcon_rpc_get_reply(struct lstcon_rpc *crpc, struct srpc_msg **msgpp)
388 struct lstcon_node *nd = crpc->crp_node;
389 struct srpc_client_rpc *rpc = crpc->crp_rpc;
390 struct srpc_generic_reply *rep;
393 LASSERT(crpc->crp_stamp);
395 if (crpc->crp_status) {
397 return crpc->crp_status;
400 *msgpp = &rpc->crpc_replymsg;
401 if (!crpc->crp_unpacked) {
402 sfw_unpack_message(*msgpp);
403 crpc->crp_unpacked = 1;
406 if (cfs_time_after(nd->nd_stamp, crpc->crp_stamp))
409 nd->nd_stamp = crpc->crp_stamp;
410 rep = &(*msgpp)->msg_body.reply;
412 if (rep->sid.ses_nid == LNET_NID_ANY)
413 nd->nd_state = LST_NODE_UNKNOWN;
414 else if (lstcon_session_match(rep->sid))
415 nd->nd_state = LST_NODE_ACTIVE;
417 nd->nd_state = LST_NODE_BUSY;
423 lstcon_rpc_trans_stat(struct lstcon_rpc_trans *trans, struct lstcon_trans_stat *stat)
425 struct lstcon_rpc *crpc;
426 struct srpc_msg *rep;
431 memset(stat, 0, sizeof(*stat));
433 list_for_each_entry(crpc, &trans->tas_rpcs_list, crp_link) {
434 lstcon_rpc_stat_total(stat, 1);
436 LASSERT(crpc->crp_stamp);
438 error = lstcon_rpc_get_reply(crpc, &rep);
440 lstcon_rpc_stat_failure(stat, 1);
441 if (!stat->trs_rpc_errno)
442 stat->trs_rpc_errno = -error;
447 lstcon_rpc_stat_success(stat, 1);
449 lstcon_rpc_stat_reply(trans, rep, crpc->crp_node, stat);
452 if (trans->tas_opc == LST_TRANS_SESNEW && !stat->trs_fwk_errno) {
453 stat->trs_fwk_errno =
454 lstcon_session_feats_check(trans->tas_features);
457 CDEBUG(D_NET, "transaction %s : success %d, failure %d, total %d, RPC error(%d), Framework error(%d)\n",
458 lstcon_rpc_trans_name(trans->tas_opc),
459 lstcon_rpc_stat_success(stat, 0),
460 lstcon_rpc_stat_failure(stat, 0),
461 lstcon_rpc_stat_total(stat, 0),
462 stat->trs_rpc_errno, stat->trs_fwk_errno);
466 lstcon_rpc_trans_interpreter(struct lstcon_rpc_trans *trans,
467 struct list_head __user *head_up,
468 lstcon_rpc_readent_func_t readent)
470 struct list_head tmp;
471 struct list_head __user *next;
472 struct lstcon_rpc_ent *ent;
473 struct srpc_generic_reply *rep;
474 struct lstcon_rpc *crpc;
475 struct srpc_msg *msg;
476 struct lstcon_node *nd;
485 list_for_each_entry(crpc, &trans->tas_rpcs_list, crp_link) {
486 if (copy_from_user(&tmp, next,
487 sizeof(struct list_head)))
494 ent = list_entry(next, struct lstcon_rpc_ent, rpe_link);
496 LASSERT(crpc->crp_stamp);
498 error = lstcon_rpc_get_reply(crpc, &msg);
502 dur = (long)cfs_time_sub(crpc->crp_stamp,
503 (unsigned long)console_session.ses_id.ses_stamp);
504 jiffies_to_timeval(dur, &tv);
506 if (copy_to_user(&ent->rpe_peer, &nd->nd_id,
507 sizeof(struct lnet_process_id)) ||
508 copy_to_user(&ent->rpe_stamp, &tv, sizeof(tv)) ||
509 copy_to_user(&ent->rpe_state, &nd->nd_state,
510 sizeof(nd->nd_state)) ||
511 copy_to_user(&ent->rpe_rpc_errno, &error,
519 rep = (struct srpc_generic_reply *)&msg->msg_body.reply;
521 if (copy_to_user(&ent->rpe_sid, &rep->sid, sizeof(rep->sid)) ||
522 copy_to_user(&ent->rpe_fwk_errno, &rep->status,
523 sizeof(rep->status)))
529 error = readent(trans->tas_opc, msg, ent);
538 lstcon_rpc_trans_destroy(struct lstcon_rpc_trans *trans)
540 struct srpc_client_rpc *rpc;
541 struct lstcon_rpc *crpc;
542 struct lstcon_rpc *tmp;
545 list_for_each_entry_safe(crpc, tmp, &trans->tas_rpcs_list, crp_link) {
548 spin_lock(&rpc->crpc_lock);
550 /* free it if not posted or finished already */
551 if (!crpc->crp_posted || crpc->crp_finished) {
552 spin_unlock(&rpc->crpc_lock);
554 list_del_init(&crpc->crp_link);
555 lstcon_rpc_put(crpc);
561 * rpcs can be still not callbacked (even LNetMDUnlink is
562 * called) because huge timeout for inaccessible network,
563 * don't make user wait for them, just abandon them, they
564 * will be recycled in callback
566 LASSERT(crpc->crp_status);
568 crpc->crp_node = NULL;
569 crpc->crp_trans = NULL;
570 list_del_init(&crpc->crp_link);
573 spin_unlock(&rpc->crpc_lock);
575 atomic_dec(&trans->tas_remaining);
578 LASSERT(!atomic_read(&trans->tas_remaining));
580 list_del(&trans->tas_link);
581 if (!list_empty(&trans->tas_olink))
582 list_del(&trans->tas_olink);
584 CDEBUG(D_NET, "Transaction %s destroyed with %d pending RPCs\n",
585 lstcon_rpc_trans_name(trans->tas_opc), count);
587 LIBCFS_FREE(trans, sizeof(*trans));
591 lstcon_sesrpc_prep(struct lstcon_node *nd, int transop,
592 unsigned int feats, struct lstcon_rpc **crpc)
594 struct srpc_mksn_reqst *msrq;
595 struct srpc_rmsn_reqst *rsrq;
599 case LST_TRANS_SESNEW:
600 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_MAKE_SESSION,
605 msrq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.mksn_reqst;
606 msrq->mksn_sid = console_session.ses_id;
607 msrq->mksn_force = console_session.ses_force;
608 strlcpy(msrq->mksn_name, console_session.ses_name,
609 sizeof(msrq->mksn_name));
612 case LST_TRANS_SESEND:
613 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_REMOVE_SESSION,
618 rsrq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.rmsn_reqst;
619 rsrq->rmsn_sid = console_session.ses_id;
630 lstcon_dbgrpc_prep(struct lstcon_node *nd, unsigned int feats,
631 struct lstcon_rpc **crpc)
633 struct srpc_debug_reqst *drq;
636 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_DEBUG, feats, 0, 0, crpc);
640 drq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.dbg_reqst;
642 drq->dbg_sid = console_session.ses_id;
649 lstcon_batrpc_prep(struct lstcon_node *nd, int transop, unsigned int feats,
650 struct lstcon_tsb_hdr *tsb, struct lstcon_rpc **crpc)
652 struct lstcon_batch *batch;
653 struct srpc_batch_reqst *brq;
656 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_BATCH, feats, 0, 0, crpc);
660 brq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.bat_reqst;
662 brq->bar_sid = console_session.ses_id;
663 brq->bar_bid = tsb->tsb_id;
664 brq->bar_testidx = tsb->tsb_index;
665 brq->bar_opc = transop == LST_TRANS_TSBRUN ? SRPC_BATCH_OPC_RUN :
666 (transop == LST_TRANS_TSBSTOP ? SRPC_BATCH_OPC_STOP :
667 SRPC_BATCH_OPC_QUERY);
669 if (transop != LST_TRANS_TSBRUN &&
670 transop != LST_TRANS_TSBSTOP)
673 LASSERT(!tsb->tsb_index);
675 batch = (struct lstcon_batch *)tsb;
676 brq->bar_arg = batch->bat_arg;
682 lstcon_statrpc_prep(struct lstcon_node *nd, unsigned int feats,
683 struct lstcon_rpc **crpc)
685 struct srpc_stat_reqst *srq;
688 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_QUERY_STAT, feats, 0, 0, crpc);
692 srq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.stat_reqst;
694 srq->str_sid = console_session.ses_id;
695 srq->str_type = 0; /* XXX remove it */
700 static struct lnet_process_id_packed *
701 lstcon_next_id(int idx, int nkiov, struct bio_vec *kiov)
703 struct lnet_process_id_packed *pid;
706 i = idx / SFW_ID_PER_PAGE;
710 pid = (struct lnet_process_id_packed *)page_address(kiov[i].bv_page);
712 return &pid[idx % SFW_ID_PER_PAGE];
716 lstcon_dstnodes_prep(struct lstcon_group *grp, int idx,
717 int dist, int span, int nkiov, struct bio_vec *kiov)
719 struct lnet_process_id_packed *pid;
720 struct lstcon_ndlink *ndl;
721 struct lstcon_node *nd;
728 LASSERT(grp->grp_nnode >= 1);
730 if (span > grp->grp_nnode)
733 start = ((idx / dist) * span) % grp->grp_nnode;
734 end = ((idx / dist) * span + span - 1) % grp->grp_nnode;
736 list_for_each_entry(ndl, &grp->grp_ndl_list, ndl_link) {
743 if (i > (end >= start ? end : grp->grp_nnode))
746 pid = lstcon_next_id((i - start), nkiov, kiov);
747 pid->nid = nd->nd_id.nid;
748 pid->pid = nd->nd_id.pid;
752 if (start <= end) /* done */
755 list_for_each_entry(ndl, &grp->grp_ndl_list, ndl_link) {
756 if (i > grp->grp_nnode + end)
760 pid = lstcon_next_id((i - start), nkiov, kiov);
761 pid->nid = nd->nd_id.nid;
762 pid->pid = nd->nd_id.pid;
770 lstcon_pingrpc_prep(struct lst_test_ping_param *param, struct srpc_test_reqst *req)
772 struct test_ping_req *prq = &req->tsr_u.ping;
774 prq->png_size = param->png_size;
775 prq->png_flags = param->png_flags;
781 lstcon_bulkrpc_v0_prep(struct lst_test_bulk_param *param,
782 struct srpc_test_reqst *req)
784 struct test_bulk_req *brq = &req->tsr_u.bulk_v0;
786 brq->blk_opc = param->blk_opc;
787 brq->blk_npg = DIV_ROUND_UP(param->blk_size, PAGE_SIZE);
788 brq->blk_flags = param->blk_flags;
794 lstcon_bulkrpc_v1_prep(struct lst_test_bulk_param *param, bool is_client,
795 struct srpc_test_reqst *req)
797 struct test_bulk_req_v1 *brq = &req->tsr_u.bulk_v1;
799 brq->blk_opc = param->blk_opc;
800 brq->blk_flags = param->blk_flags;
801 brq->blk_len = param->blk_size;
802 brq->blk_offset = is_client ? param->blk_cli_off : param->blk_srv_off;
808 lstcon_testrpc_prep(struct lstcon_node *nd, int transop, unsigned int feats,
809 struct lstcon_test *test, struct lstcon_rpc **crpc)
811 struct lstcon_group *sgrp = test->tes_src_grp;
812 struct lstcon_group *dgrp = test->tes_dst_grp;
813 struct srpc_test_reqst *trq;
814 struct srpc_bulk *bulk;
820 if (transop == LST_TRANS_TSBCLIADD) {
821 npg = sfw_id_pages(test->tes_span);
822 nob = !(feats & LST_FEAT_BULK_LEN) ?
824 sizeof(struct lnet_process_id_packed) * test->tes_span;
827 rc = lstcon_rpc_prep(nd, SRPC_SERVICE_TEST, feats, npg, nob, crpc);
831 trq = &(*crpc)->crp_rpc->crpc_reqstmsg.msg_body.tes_reqst;
833 if (transop == LST_TRANS_TSBSRVADD) {
834 int ndist = DIV_ROUND_UP(sgrp->grp_nnode, test->tes_dist);
835 int nspan = DIV_ROUND_UP(dgrp->grp_nnode, test->tes_span);
836 int nmax = DIV_ROUND_UP(ndist, nspan);
839 trq->tsr_loop = nmax * test->tes_dist * test->tes_concur;
841 bulk = &(*crpc)->crp_rpc->crpc_bulk;
843 for (i = 0; i < npg; i++) {
848 len = !(feats & LST_FEAT_BULK_LEN) ?
850 min_t(int, nob, PAGE_SIZE);
853 bulk->bk_iovs[i].bv_offset = 0;
854 bulk->bk_iovs[i].bv_len = len;
855 bulk->bk_iovs[i].bv_page = alloc_page(GFP_KERNEL);
857 if (!bulk->bk_iovs[i].bv_page) {
858 lstcon_rpc_put(*crpc);
865 LASSERT(transop == LST_TRANS_TSBCLIADD);
867 rc = lstcon_dstnodes_prep(test->tes_dst_grp,
871 npg, &bulk->bk_iovs[0]);
873 lstcon_rpc_put(*crpc);
877 trq->tsr_ndest = test->tes_span;
878 trq->tsr_loop = test->tes_loop;
881 trq->tsr_sid = console_session.ses_id;
882 trq->tsr_bid = test->tes_hdr.tsb_id;
883 trq->tsr_concur = test->tes_concur;
884 trq->tsr_is_client = (transop == LST_TRANS_TSBCLIADD) ? 1 : 0;
885 trq->tsr_stop_onerr = !!test->tes_stop_onerr;
887 switch (test->tes_type) {
889 trq->tsr_service = SRPC_SERVICE_PING;
890 rc = lstcon_pingrpc_prep((struct lst_test_ping_param *)
891 &test->tes_param[0], trq);
895 trq->tsr_service = SRPC_SERVICE_BRW;
896 if (!(feats & LST_FEAT_BULK_LEN)) {
897 rc = lstcon_bulkrpc_v0_prep((struct lst_test_bulk_param *)
898 &test->tes_param[0], trq);
900 rc = lstcon_bulkrpc_v1_prep((struct lst_test_bulk_param *)
902 trq->tsr_is_client, trq);
915 lstcon_sesnew_stat_reply(struct lstcon_rpc_trans *trans,
916 struct lstcon_node *nd, struct srpc_msg *reply)
918 struct srpc_mksn_reply *mksn_rep = &reply->msg_body.mksn_reply;
919 int status = mksn_rep->mksn_status;
922 (reply->msg_ses_feats & ~LST_FEATS_MASK)) {
923 mksn_rep->mksn_status = EPROTO;
927 if (status == EPROTO) {
928 CNETERR("session protocol error from %s: %u\n",
929 libcfs_nid2str(nd->nd_id.nid),
930 reply->msg_ses_feats);
936 if (!trans->tas_feats_updated) {
937 spin_lock(&console_session.ses_rpc_lock);
938 if (!trans->tas_feats_updated) { /* recheck with lock */
939 trans->tas_feats_updated = 1;
940 trans->tas_features = reply->msg_ses_feats;
942 spin_unlock(&console_session.ses_rpc_lock);
945 if (reply->msg_ses_feats != trans->tas_features) {
946 CNETERR("Framework features %x from %s is different with features on this transaction: %x\n",
947 reply->msg_ses_feats, libcfs_nid2str(nd->nd_id.nid),
948 trans->tas_features);
949 mksn_rep->mksn_status = EPROTO;
954 /* session timeout on remote node */
955 nd->nd_timeout = mksn_rep->mksn_timeout;
962 lstcon_rpc_stat_reply(struct lstcon_rpc_trans *trans, struct srpc_msg *msg,
963 struct lstcon_node *nd, struct lstcon_trans_stat *stat)
965 struct srpc_rmsn_reply *rmsn_rep;
966 struct srpc_debug_reply *dbg_rep;
967 struct srpc_batch_reply *bat_rep;
968 struct srpc_test_reply *test_rep;
969 struct srpc_stat_reply *stat_rep;
972 switch (trans->tas_opc) {
973 case LST_TRANS_SESNEW:
974 rc = lstcon_sesnew_stat_reply(trans, nd, msg);
976 lstcon_sesop_stat_success(stat, 1);
980 lstcon_sesop_stat_failure(stat, 1);
983 case LST_TRANS_SESEND:
984 rmsn_rep = &msg->msg_body.rmsn_reply;
985 /* ESRCH is not an error for end session */
986 if (!rmsn_rep->rmsn_status ||
987 rmsn_rep->rmsn_status == ESRCH) {
988 lstcon_sesop_stat_success(stat, 1);
992 lstcon_sesop_stat_failure(stat, 1);
993 rc = rmsn_rep->rmsn_status;
996 case LST_TRANS_SESQRY:
997 case LST_TRANS_SESPING:
998 dbg_rep = &msg->msg_body.dbg_reply;
1000 if (dbg_rep->dbg_status == ESRCH) {
1001 lstcon_sesqry_stat_unknown(stat, 1);
1005 if (lstcon_session_match(dbg_rep->dbg_sid))
1006 lstcon_sesqry_stat_active(stat, 1);
1008 lstcon_sesqry_stat_busy(stat, 1);
1011 case LST_TRANS_TSBRUN:
1012 case LST_TRANS_TSBSTOP:
1013 bat_rep = &msg->msg_body.bat_reply;
1015 if (!bat_rep->bar_status) {
1016 lstcon_tsbop_stat_success(stat, 1);
1020 if (bat_rep->bar_status == EPERM &&
1021 trans->tas_opc == LST_TRANS_TSBSTOP) {
1022 lstcon_tsbop_stat_success(stat, 1);
1026 lstcon_tsbop_stat_failure(stat, 1);
1027 rc = bat_rep->bar_status;
1030 case LST_TRANS_TSBCLIQRY:
1031 case LST_TRANS_TSBSRVQRY:
1032 bat_rep = &msg->msg_body.bat_reply;
1034 if (bat_rep->bar_active)
1035 lstcon_tsbqry_stat_run(stat, 1);
1037 lstcon_tsbqry_stat_idle(stat, 1);
1039 if (!bat_rep->bar_status)
1042 lstcon_tsbqry_stat_failure(stat, 1);
1043 rc = bat_rep->bar_status;
1046 case LST_TRANS_TSBCLIADD:
1047 case LST_TRANS_TSBSRVADD:
1048 test_rep = &msg->msg_body.tes_reply;
1050 if (!test_rep->tsr_status) {
1051 lstcon_tsbop_stat_success(stat, 1);
1055 lstcon_tsbop_stat_failure(stat, 1);
1056 rc = test_rep->tsr_status;
1059 case LST_TRANS_STATQRY:
1060 stat_rep = &msg->msg_body.stat_reply;
1062 if (!stat_rep->str_status) {
1063 lstcon_statqry_stat_success(stat, 1);
1067 lstcon_statqry_stat_failure(stat, 1);
1068 rc = stat_rep->str_status;
1075 if (!stat->trs_fwk_errno)
1076 stat->trs_fwk_errno = rc;
1080 lstcon_rpc_trans_ndlist(struct list_head *ndlist,
1081 struct list_head *translist, int transop,
1082 void *arg, lstcon_rpc_cond_func_t condition,
1083 struct lstcon_rpc_trans **transpp)
1085 struct lstcon_rpc_trans *trans;
1086 struct lstcon_ndlink *ndl;
1087 struct lstcon_node *nd;
1088 struct lstcon_rpc *rpc;
1092 /* Creating session RPG for list of nodes */
1094 rc = lstcon_rpc_trans_prep(translist, transop, &trans);
1096 CERROR("Can't create transaction %d: %d\n", transop, rc);
1100 feats = trans->tas_features;
1101 list_for_each_entry(ndl, ndlist, ndl_link) {
1102 rc = !condition ? 1 :
1103 condition(transop, ndl->ndl_node, arg);
1109 CDEBUG(D_NET, "Condition error while creating RPC for transaction %d: %d\n",
1117 case LST_TRANS_SESNEW:
1118 case LST_TRANS_SESEND:
1119 rc = lstcon_sesrpc_prep(nd, transop, feats, &rpc);
1121 case LST_TRANS_SESQRY:
1122 case LST_TRANS_SESPING:
1123 rc = lstcon_dbgrpc_prep(nd, feats, &rpc);
1125 case LST_TRANS_TSBCLIADD:
1126 case LST_TRANS_TSBSRVADD:
1127 rc = lstcon_testrpc_prep(nd, transop, feats,
1128 (struct lstcon_test *)arg,
1131 case LST_TRANS_TSBRUN:
1132 case LST_TRANS_TSBSTOP:
1133 case LST_TRANS_TSBCLIQRY:
1134 case LST_TRANS_TSBSRVQRY:
1135 rc = lstcon_batrpc_prep(nd, transop, feats,
1136 (struct lstcon_tsb_hdr *)arg,
1139 case LST_TRANS_STATQRY:
1140 rc = lstcon_statrpc_prep(nd, feats, &rpc);
1148 CERROR("Failed to create RPC for transaction %s: %d\n",
1149 lstcon_rpc_trans_name(transop), rc);
1153 lstcon_rpc_trans_addreq(trans, rpc);
1161 lstcon_rpc_trans_destroy(trans);
1167 lstcon_rpc_pinger(void *arg)
1169 struct stt_timer *ptimer = (struct stt_timer *)arg;
1170 struct lstcon_rpc_trans *trans;
1171 struct lstcon_rpc *crpc;
1172 struct srpc_msg *rep;
1173 struct srpc_debug_reqst *drq;
1174 struct lstcon_ndlink *ndl;
1175 struct lstcon_node *nd;
1181 * RPC pinger is a special case of transaction,
1182 * it's called by timer at 8 seconds interval.
1184 mutex_lock(&console_session.ses_mutex);
1186 if (console_session.ses_shutdown || console_session.ses_expired) {
1187 mutex_unlock(&console_session.ses_mutex);
1191 if (!console_session.ses_expired &&
1192 ktime_get_real_seconds() - console_session.ses_laststamp >
1193 (time64_t)console_session.ses_timeout)
1194 console_session.ses_expired = 1;
1196 trans = console_session.ses_ping;
1200 list_for_each_entry(ndl, &console_session.ses_ndl_list, ndl_link) {
1203 if (console_session.ses_expired) {
1204 /* idle console, end session on all nodes */
1205 if (nd->nd_state != LST_NODE_ACTIVE)
1208 rc = lstcon_sesrpc_prep(nd, LST_TRANS_SESEND,
1209 trans->tas_features, &crpc);
1211 CERROR("Out of memory\n");
1215 lstcon_rpc_trans_addreq(trans, crpc);
1216 lstcon_rpc_post(crpc);
1221 crpc = &nd->nd_ping;
1223 if (crpc->crp_rpc) {
1224 LASSERT(crpc->crp_trans == trans);
1225 LASSERT(!list_empty(&crpc->crp_link));
1227 spin_lock(&crpc->crp_rpc->crpc_lock);
1229 LASSERT(crpc->crp_posted);
1231 if (!crpc->crp_finished) {
1233 spin_unlock(&crpc->crp_rpc->crpc_lock);
1237 spin_unlock(&crpc->crp_rpc->crpc_lock);
1239 lstcon_rpc_get_reply(crpc, &rep);
1241 list_del_init(&crpc->crp_link);
1243 lstcon_rpc_put(crpc);
1246 if (nd->nd_state != LST_NODE_ACTIVE)
1249 intv = (jiffies - nd->nd_stamp) / msecs_to_jiffies(MSEC_PER_SEC);
1250 if (intv < nd->nd_timeout / 2)
1253 rc = lstcon_rpc_init(nd, SRPC_SERVICE_DEBUG,
1254 trans->tas_features, 0, 0, 1, crpc);
1256 CERROR("Out of memory\n");
1260 drq = &crpc->crp_rpc->crpc_reqstmsg.msg_body.dbg_reqst;
1262 drq->dbg_sid = console_session.ses_id;
1265 lstcon_rpc_trans_addreq(trans, crpc);
1266 lstcon_rpc_post(crpc);
1271 if (console_session.ses_expired) {
1272 mutex_unlock(&console_session.ses_mutex);
1276 CDEBUG(D_NET, "Ping %d nodes in session\n", count);
1278 ptimer->stt_expires = ktime_get_real_seconds() + LST_PING_INTERVAL;
1279 stt_add_timer(ptimer);
1281 mutex_unlock(&console_session.ses_mutex);
1285 lstcon_rpc_pinger_start(void)
1287 struct stt_timer *ptimer;
1290 LASSERT(list_empty(&console_session.ses_rpc_freelist));
1291 LASSERT(!atomic_read(&console_session.ses_rpc_counter));
1293 rc = lstcon_rpc_trans_prep(NULL, LST_TRANS_SESPING,
1294 &console_session.ses_ping);
1296 CERROR("Failed to create console pinger\n");
1300 ptimer = &console_session.ses_ping_timer;
1301 ptimer->stt_expires = ktime_get_real_seconds() + LST_PING_INTERVAL;
1303 stt_add_timer(ptimer);
1309 lstcon_rpc_pinger_stop(void)
1311 LASSERT(console_session.ses_shutdown);
1313 stt_del_timer(&console_session.ses_ping_timer);
1315 lstcon_rpc_trans_abort(console_session.ses_ping, -ESHUTDOWN);
1316 lstcon_rpc_trans_stat(console_session.ses_ping, lstcon_trans_stat());
1317 lstcon_rpc_trans_destroy(console_session.ses_ping);
1319 memset(lstcon_trans_stat(), 0, sizeof(struct lstcon_trans_stat));
1321 console_session.ses_ping = NULL;
1325 lstcon_rpc_cleanup_wait(void)
1327 struct lstcon_rpc_trans *trans;
1328 struct lstcon_rpc *crpc;
1329 struct lstcon_rpc *temp;
1330 struct list_head *pacer;
1331 struct list_head zlist;
1333 /* Called with hold of global mutex */
1335 LASSERT(console_session.ses_shutdown);
1337 while (!list_empty(&console_session.ses_trans_list)) {
1338 list_for_each(pacer, &console_session.ses_trans_list) {
1339 trans = list_entry(pacer, struct lstcon_rpc_trans,
1342 CDEBUG(D_NET, "Session closed, wakeup transaction %s\n",
1343 lstcon_rpc_trans_name(trans->tas_opc));
1345 wake_up(&trans->tas_waitq);
1348 mutex_unlock(&console_session.ses_mutex);
1350 CWARN("Session is shutting down, waiting for termination of transactions\n");
1351 set_current_state(TASK_UNINTERRUPTIBLE);
1352 schedule_timeout(cfs_time_seconds(1));
1354 mutex_lock(&console_session.ses_mutex);
1357 spin_lock(&console_session.ses_rpc_lock);
1359 lst_wait_until(!atomic_read(&console_session.ses_rpc_counter),
1360 console_session.ses_rpc_lock,
1361 "Network is not accessible or target is down, waiting for %d console RPCs to being recycled\n",
1362 atomic_read(&console_session.ses_rpc_counter));
1364 list_add(&zlist, &console_session.ses_rpc_freelist);
1365 list_del_init(&console_session.ses_rpc_freelist);
1367 spin_unlock(&console_session.ses_rpc_lock);
1369 list_for_each_entry_safe(crpc, temp, &zlist, crp_link) {
1370 list_del(&crpc->crp_link);
1371 LIBCFS_FREE(crpc, sizeof(struct lstcon_rpc));
1376 lstcon_rpc_module_init(void)
1378 INIT_LIST_HEAD(&console_session.ses_ping_timer.stt_list);
1379 console_session.ses_ping_timer.stt_func = lstcon_rpc_pinger;
1380 console_session.ses_ping_timer.stt_data = &console_session.ses_ping_timer;
1382 console_session.ses_ping = NULL;
1384 spin_lock_init(&console_session.ses_rpc_lock);
1385 atomic_set(&console_session.ses_rpc_counter, 0);
1386 INIT_LIST_HEAD(&console_session.ses_rpc_freelist);
1392 lstcon_rpc_module_fini(void)
1394 LASSERT(list_empty(&console_session.ses_rpc_freelist));
1395 LASSERT(!atomic_read(&console_session.ses_rpc_counter));