From: Hal Rosenstock <hal-LDSdmyG8hGV8YrgS2mwiifqBs+8SCbDb@public.gmane.org>
To: Dan Ben Yosef <danby-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
Cc: Ira Weiny <weiny2-i2BcT+NCU+M@public.gmane.org>,
linux-rdma-u79uwXL29TY76Z2rM5mHXA@public.gmane.org
Subject: Re: [PATCHv3] infiniband-diags/ibqueryerrors.c: obtain destination sl before perf query
Date: Thu, 28 Feb 2013 11:11:15 -0500 [thread overview]
Message-ID: <512F81A3.6000100@dev.mellanox.co.il> (raw)
In-Reply-To: <20130227141032.GA9919-Kyg1NGsloJ8bMuq+TCmafCexzy7lsfyC@public.gmane.org>
On 2/27/2013 9:10 AM, Dan Ben Yosef wrote:
> 1) if use -G or -D option : we obtain sl before doing perf query.
> 2) if no destination is given : we obtain sl for every pair source-destination.
> 3) if no destination is given and use --skip-sl option : we don't obtain
> sl to all nodes in the fabric,in this case sl=0 for all node pairs.
It might be noted that this is not recommended in the case of QoS aware
routing engines as this can cause credit deadlock.
>
> Signed-off-by: Dan Ben Yosef <danby-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org>
> ---
> Changes since v2:
> 1.Skip-sl option will apply to 1 and 2.
> 2.Update documentation doc/rst/ibqueryerrors.8.in.rst
> 3.Pop the resolve_self call to be before the check for dr_path.
> 4.Add new variable self_portid for the usage of resolve_self only.
> 5.Change "goto close_port" into "goto destroy_fabric" if fabric object
> is created.
>
> doc/rst/ibqueryerrors.8.in.rst | 2 +
> src/ibqueryerrors.c | 81 +++++++++++++++++++++++++++++++++++++++-
> 2 files changed, 81 insertions(+), 2 deletions(-)
>
> diff --git a/doc/rst/ibqueryerrors.8.in.rst b/doc/rst/ibqueryerrors.8.in.rst
> index 9a05e7b..b910368 100644
> --- a/doc/rst/ibqueryerrors.8.in.rst
> +++ b/doc/rst/ibqueryerrors.8.in.rst
> @@ -52,6 +52,8 @@ Specify an alternate threshold file. The default is @IBDIAG_CONFIG_PATH@/error_
>
> **--ca** print data for CA's only
>
> +**--skip-sl** Use the default sl for queries
> +
> **--router** print data for routers only
>
> **--clear-errors -k** Clear error counters after read.
> diff --git a/src/ibqueryerrors.c b/src/ibqueryerrors.c
> index 6320972..6d17497 100644
> --- a/src/ibqueryerrors.c
> +++ b/src/ibqueryerrors.c
> @@ -55,11 +55,14 @@
> #include <infiniband/mad.h>
>
> #include "ibdiag_common.h"
> +#include "ibdiag_sa.h"
>
> struct ibmad_port *ibmad_port;
> static char *node_name_map_file = NULL;
> static nn_map_t *node_name_map = NULL;
> static char *load_cache_file = NULL;
> +static uint16_t lid2sl_table[sizeof(uint8_t) * 1024 * 48] = { 0 };
> +static int obtain_sl = 1;
>
> int data_counters = 0;
> int data_counters_only = 0;
> @@ -78,6 +81,8 @@ unsigned clear_errors = 0, clear_counts = 0, details = 0;
> #define PRINT_ROUTER 0x4
> #define PRINT_ALL 0xFF /* all nodes default flag */
>
> +#define DEFAULT_HALF_WORLD_PR_TIMEOUT (3000)
> +
> struct {
> int nodes_checked;
> int bad_nodes;
> @@ -298,6 +303,51 @@ static int print_summary(void)
> return (summary.bad_ports);
> }
>
> +static void insert_lid2sl_table(struct sa_query_result *r)
> +{
> + unsigned int i;
> + for (i = 0; i < r->result_cnt; i++) {
> + ib_path_rec_t *p_pr = (ib_path_rec_t *)sa_get_query_rec(r->p_result_madw, i);
> + lid2sl_table[cl_ntoh16(p_pr->dlid)] = ib_path_rec_sl(p_pr);
> + }
> +}
> +
> +static int path_record_query(int src_lid,int dest_lid)
> +{
> + ib_path_rec_t pr;
> + ib_net64_t comp_mask = 0;
> + uint8_t reversible = 0;
> + struct sa_handle * h;
> +
> + h = sa_get_handle();
> + ibd_timeout = DEFAULT_HALF_WORLD_PR_TIMEOUT;
> + memset(&pr, 0, sizeof(pr));
> +
> + CHECK_AND_SET_VAL(src_lid, 16, 0, pr.slid, PR, SLID);
Doesn't SGID rather than SLID need to be specified to be compliant
GetTable query ?
> + CHECK_AND_SET_VAL(dest_lid, 16, 0, pr.dlid, PR, DLID);/*if dlid is 0 then we do half world query*/
I think this should be:
if (dest_lid)
CHECK_AND_SET_VAL(dest_lid, 16, 0, pr.dlid, PR, DLID);
so that comp mask bit is not set for DLID so that it's wildcarded.
> + CHECK_AND_SET_VAL(1, 8, -1, pr.num_path, PR, NUMBPATH);/*to get only one PathRecord for each source and destination pair*/
> + CHECK_AND_SET_VAL(1, 8, -1, reversible, PR, REVERSIBLE);/*for a reversible path*/
> + pr.num_path |= reversible << 7;
> + struct sa_query_result result;
> + int ret = sa_query(h, IB_MAD_METHOD_GET_TABLE,
> + (uint16_t)IB_SA_ATTR_PATHRECORD,0,cl_ntoh64(comp_mask),ibd_sakey,
> + &pr, sizeof(pr), &result);
> + if (ret) {
> + fprintf(stderr, "Query SA failed: %s; sa call path_query failed\n", strerror(ret));
> + return ret;
> + }
> + if (result.status != IB_SA_MAD_STATUS_SUCCESS) {
> + sa_report_err(result.status);
> + ret = EIO;
> + goto Exit;
> + }
> +
> + insert_lid2sl_table(&result);
> +Exit:
> + sa_free_result_mad(&result);
> + return ret;
> +}
> +
> static int query_and_dump(char *buf, size_t size, ib_portid_t * portid,
> ibnd_node_t * node, char *node_name, int portnum,
> const char *attr_name, uint16_t attr_id,
> @@ -447,6 +497,8 @@ static int query_cap_mask(ib_portid_t * portid, char *node_name, int portnum,
> uint8_t pc[1024] = { 0 };
> uint16_t rc_cap_mask;
>
> + portid->sl = lid2sl_table[portid->lid];
> +
> /* PerfMgt ClassPortInfo is a required attribute */
> if (!pma_query_via(pc, portid, portnum, ibd_timeout, CLASS_PORT_INFO,
> ibmad_port)) {
> @@ -474,6 +526,8 @@ static int print_data_cnts(ib_portid_t * portid, uint16_t cap_mask,
>
> memset(pc, 0, 1024);
>
> + portid->sl = lid2sl_table[portid->lid];
> +
> if (cap_mask & (IB_PM_EXT_WIDTH_SUPPORTED | IB_PM_EXT_WIDTH_NOIETF_SUP)) {
> if (!pma_query_via(pc, portid, portnum, ibd_timeout,
> IB_GSI_PORT_COUNTERS_EXT, ibmad_port)) {
> @@ -543,6 +597,8 @@ static int print_errors(ib_portid_t * portid, uint16_t cap_mask,
> memset(pc, 0, 1024);
> memset(pce, 0, 1024);
>
> + portid->sl = lid2sl_table[portid->lid];
> +
> if (!pma_query_via(pc, portid, portnum, ibd_timeout,
> IB_GSI_PORT_COUNTERS, ibmad_port)) {
> IBWARN("IB_GSI_PORT_COUNTERS query failed on %s, %s port %d",
> @@ -822,6 +878,9 @@ static int process_opt(void *context, int ch, char *optarg)
> case 9:
> data_counters_only = 1;
> break;
> + case 10:
> + obtain_sl = 0;
> + break;
> case 'G':
> case 'S':
> port_guid_str = optarg;
> @@ -856,8 +915,11 @@ int main(int argc, char **argv)
> struct ibnd_config config = { 0 };
> int resolved = -1;
> ib_portid_t portid = { 0 };
> + ib_portid_t self_portid = { 0 };
> int rc = 0;
> ibnd_fabric_t *fabric = NULL;
> + int self_lid = 0;
> + int port = 0;
>
> int mgmt_classes[4] = { IB_SMI_CLASS, IB_SMI_DIRECT_CLASS, IB_SA_CLASS,
> IB_PERFORMANCE_CLASS
> @@ -875,6 +937,7 @@ int main(int argc, char **argv)
> "Same as \"-G\" for backward compatibility"},
> {"Direct", 'D', 1, "<dr_path>",
> "report the node containing the port specified by <dr_path>"},
> + {"skip-sl", 10, 0, NULL,"don't obtain SL to all destinations"},
> {"report-port", 'r', 0, NULL,
> "report port link information"},
> {"threshold-file", 8, 1, NULL,
> @@ -931,6 +994,12 @@ int main(int argc, char **argv)
> exit(-1);
> }
>
> + if (resolve_self(ibd_ca, ibd_ca_port, &self_portid, &port, 0) < 0) {
resolve_self is deprecated; should use resolve_self_via
-- Hal
> + IBERROR("can't resolve self port %s", argv[0]);
> + goto close_port;
> + }
> + self_lid = self_portid.lid;
> +
> /* limit the scan the fabric around the target */
> if (dr_path) {
> if ((resolved =
> @@ -947,6 +1016,8 @@ int main(int argc, char **argv)
> IBWARN("Failed to resolve %s;",port_guid_str);
> goto close_port;
> }
> + if(obtain_sl)
> + lid2sl_table[portid.lid] = portid.sl;
> }
>
> if (load_cache_file) {
> @@ -996,12 +1067,18 @@ int main(int argc, char **argv)
>
> port = ibnd_find_port_guid(fabric, port_guid);
> if (port) {
> + if(obtain_sl)
> + if(path_record_query(self_lid,port->base_lid))
> + goto destroy_fabric;
> print_node(port->node, NULL);
> } else
> fprintf(stderr, "Failed to find node: %s\n", dr_path);
> - } else
> + } else {
> + if(obtain_sl)
> + if(path_record_query(self_lid,0))
> + goto destroy_fabric;
> ibnd_iter_nodes(fabric, print_node, NULL);
> -
> + }
> rc = print_summary();
> if (rc)
> rc = 1;
--
To unsubscribe from this list: send the line "unsubscribe linux-rdma" in
the body of a message to majordomo-u79uwXL29TY76Z2rM5mHXA@public.gmane.org
More majordomo info at http://vger.kernel.org/majordomo-info.html
next prev parent reply other threads:[~2013-02-28 16:11 UTC|newest]
Thread overview: 10+ messages / expand[flat|nested] mbox.gz Atom feed top
2013-02-20 11:58 [PATCH]: infiniband-diags/ibqueryerrors.c: obtain destination sl before perf query Dan Ben Yosef
[not found] ` <20130220115807.GC20018-Kyg1NGsloJ/nXW+7WiO5SxL4W9x8LtSr@public.gmane.org>
2013-02-20 18:46 ` Ira Weiny
2013-02-24 8:21 ` [PATCHv2] " Dan Ben Yosef
[not found] ` <20130224082140.GA11648-Kyg1NGsloJ/nXW+7WiO5SxL4W9x8LtSr@public.gmane.org>
2013-02-27 1:07 ` Ira Weiny
[not found] ` <20130226170744.53adb74b6af9a54d9481dd4c-i2BcT+NCU+M@public.gmane.org>
2013-02-27 14:10 ` [PATCHv3] " Dan Ben Yosef
[not found] ` <20130227141032.GA9919-Kyg1NGsloJ8bMuq+TCmafCexzy7lsfyC@public.gmane.org>
2013-02-28 16:11 ` Hal Rosenstock [this message]
[not found] ` <512F81A3.6000100-LDSdmyG8hGV8YrgS2mwiifqBs+8SCbDb@public.gmane.org>
2013-03-01 1:33 ` Ira Weiny
[not found] ` <20130228173336.18bc61527d20d160c9f39818-i2BcT+NCU+M@public.gmane.org>
2013-03-14 14:09 ` [PATCHv4] " Dan Ben Yosef
[not found] ` <20130314140902.GA10423-Kyg1NGsloJ8bMuq+TCmafCexzy7lsfyC@public.gmane.org>
2013-03-14 14:52 ` [PATCHv5] " Dan Ben Yosef
[not found] ` <20130314145246.GA13095-Kyg1NGsloJ8bMuq+TCmafCexzy7lsfyC@public.gmane.org>
2013-03-18 20:34 ` Ira Weiny
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=512F81A3.6000100@dev.mellanox.co.il \
--to=hal-ldsdmyg8hgv8yrgs2mwiifqbs+8scbdb@public.gmane.org \
--cc=danby-VPRAkNaXOzVWk0Htik3J/w@public.gmane.org \
--cc=linux-rdma-u79uwXL29TY76Z2rM5mHXA@public.gmane.org \
--cc=weiny2-i2BcT+NCU+M@public.gmane.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox