GNU Linux-libre 4.9.287-gnu1
[releases.git] / drivers / infiniband / hw / qib / qib_driver.c
1 /*
2  * Copyright (c) 2013 Intel Corporation. All rights reserved.
3  * Copyright (c) 2006, 2007, 2008, 2009 QLogic Corporation. All rights reserved.
4  * Copyright (c) 2003, 2004, 2005, 2006 PathScale, Inc. All rights reserved.
5  *
6  * This software is available to you under a choice of one of two
7  * licenses.  You may choose to be licensed under the terms of the GNU
8  * General Public License (GPL) Version 2, available from the file
9  * COPYING in the main directory of this source tree, or the
10  * OpenIB.org BSD license below:
11  *
12  *     Redistribution and use in source and binary forms, with or
13  *     without modification, are permitted provided that the following
14  *     conditions are met:
15  *
16  *      - Redistributions of source code must retain the above
17  *        copyright notice, this list of conditions and the following
18  *        disclaimer.
19  *
20  *      - Redistributions in binary form must reproduce the above
21  *        copyright notice, this list of conditions and the following
22  *        disclaimer in the documentation and/or other materials
23  *        provided with the distribution.
24  *
25  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32  * SOFTWARE.
33  */
34
35 #include <linux/spinlock.h>
36 #include <linux/pci.h>
37 #include <linux/io.h>
38 #include <linux/delay.h>
39 #include <linux/netdevice.h>
40 #include <linux/vmalloc.h>
41 #include <linux/module.h>
42 #include <linux/prefetch.h>
43
44 #include "qib.h"
45
46 /*
47  * The size has to be longer than this string, so we can append
48  * board/chip information to it in the init code.
49  */
50 const char ib_qib_version[] = QIB_DRIVER_VERSION "\n";
51
52 DEFINE_SPINLOCK(qib_devs_lock);
53 LIST_HEAD(qib_dev_list);
54 DEFINE_MUTEX(qib_mutex);        /* general driver use */
55
56 unsigned qib_ibmtu;
57 module_param_named(ibmtu, qib_ibmtu, uint, S_IRUGO);
58 MODULE_PARM_DESC(ibmtu, "Set max IB MTU (0=2KB, 1=256, 2=512, ... 5=4096");
59
60 unsigned qib_compat_ddr_negotiate = 1;
61 module_param_named(compat_ddr_negotiate, qib_compat_ddr_negotiate, uint,
62                    S_IWUSR | S_IRUGO);
63 MODULE_PARM_DESC(compat_ddr_negotiate,
64                  "Attempt pre-IBTA 1.2 DDR speed negotiation");
65
66 MODULE_LICENSE("Dual BSD/GPL");
67 MODULE_AUTHOR("Intel <ibsupport@intel.com>");
68 MODULE_DESCRIPTION("Intel IB driver");
69 MODULE_VERSION(QIB_DRIVER_VERSION);
70
71 /*
72  * QIB_PIO_MAXIBHDR is the max IB header size allowed for in our
73  * PIO send buffers.  This is well beyond anything currently
74  * defined in the InfiniBand spec.
75  */
76 #define QIB_PIO_MAXIBHDR 128
77
78 /*
79  * QIB_MAX_PKT_RCV is the max # if packets processed per receive interrupt.
80  */
81 #define QIB_MAX_PKT_RECV 64
82
83 struct qlogic_ib_stats qib_stats;
84
85 const char *qib_get_unit_name(int unit)
86 {
87         static char iname[16];
88
89         snprintf(iname, sizeof(iname), "infinipath%u", unit);
90         return iname;
91 }
92
93 const char *qib_get_card_name(struct rvt_dev_info *rdi)
94 {
95         struct qib_ibdev *ibdev = container_of(rdi, struct qib_ibdev, rdi);
96         struct qib_devdata *dd = container_of(ibdev,
97                                               struct qib_devdata, verbs_dev);
98         return qib_get_unit_name(dd->unit);
99 }
100
101 struct pci_dev *qib_get_pci_dev(struct rvt_dev_info *rdi)
102 {
103         struct qib_ibdev *ibdev = container_of(rdi, struct qib_ibdev, rdi);
104         struct qib_devdata *dd = container_of(ibdev,
105                                               struct qib_devdata, verbs_dev);
106         return dd->pcidev;
107 }
108
109 /*
110  * Return count of units with at least one port ACTIVE.
111  */
112 int qib_count_active_units(void)
113 {
114         struct qib_devdata *dd;
115         struct qib_pportdata *ppd;
116         unsigned long flags;
117         int pidx, nunits_active = 0;
118
119         spin_lock_irqsave(&qib_devs_lock, flags);
120         list_for_each_entry(dd, &qib_dev_list, list) {
121                 if (!(dd->flags & QIB_PRESENT) || !dd->kregbase)
122                         continue;
123                 for (pidx = 0; pidx < dd->num_pports; ++pidx) {
124                         ppd = dd->pport + pidx;
125                         if (ppd->lid && (ppd->lflags & (QIBL_LINKINIT |
126                                          QIBL_LINKARMED | QIBL_LINKACTIVE))) {
127                                 nunits_active++;
128                                 break;
129                         }
130                 }
131         }
132         spin_unlock_irqrestore(&qib_devs_lock, flags);
133         return nunits_active;
134 }
135
136 /*
137  * Return count of all units, optionally return in arguments
138  * the number of usable (present) units, and the number of
139  * ports that are up.
140  */
141 int qib_count_units(int *npresentp, int *nupp)
142 {
143         int nunits = 0, npresent = 0, nup = 0;
144         struct qib_devdata *dd;
145         unsigned long flags;
146         int pidx;
147         struct qib_pportdata *ppd;
148
149         spin_lock_irqsave(&qib_devs_lock, flags);
150
151         list_for_each_entry(dd, &qib_dev_list, list) {
152                 nunits++;
153                 if ((dd->flags & QIB_PRESENT) && dd->kregbase)
154                         npresent++;
155                 for (pidx = 0; pidx < dd->num_pports; ++pidx) {
156                         ppd = dd->pport + pidx;
157                         if (ppd->lid && (ppd->lflags & (QIBL_LINKINIT |
158                                          QIBL_LINKARMED | QIBL_LINKACTIVE)))
159                                 nup++;
160                 }
161         }
162
163         spin_unlock_irqrestore(&qib_devs_lock, flags);
164
165         if (npresentp)
166                 *npresentp = npresent;
167         if (nupp)
168                 *nupp = nup;
169
170         return nunits;
171 }
172
173 /**
174  * qib_wait_linkstate - wait for an IB link state change to occur
175  * @dd: the qlogic_ib device
176  * @state: the state to wait for
177  * @msecs: the number of milliseconds to wait
178  *
179  * wait up to msecs milliseconds for IB link state change to occur for
180  * now, take the easy polling route.  Currently used only by
181  * qib_set_linkstate.  Returns 0 if state reached, otherwise
182  * -ETIMEDOUT state can have multiple states set, for any of several
183  * transitions.
184  */
185 int qib_wait_linkstate(struct qib_pportdata *ppd, u32 state, int msecs)
186 {
187         int ret;
188         unsigned long flags;
189
190         spin_lock_irqsave(&ppd->lflags_lock, flags);
191         if (ppd->state_wanted) {
192                 spin_unlock_irqrestore(&ppd->lflags_lock, flags);
193                 ret = -EBUSY;
194                 goto bail;
195         }
196         ppd->state_wanted = state;
197         spin_unlock_irqrestore(&ppd->lflags_lock, flags);
198         wait_event_interruptible_timeout(ppd->state_wait,
199                                          (ppd->lflags & state),
200                                          msecs_to_jiffies(msecs));
201         spin_lock_irqsave(&ppd->lflags_lock, flags);
202         ppd->state_wanted = 0;
203         spin_unlock_irqrestore(&ppd->lflags_lock, flags);
204
205         if (!(ppd->lflags & state))
206                 ret = -ETIMEDOUT;
207         else
208                 ret = 0;
209 bail:
210         return ret;
211 }
212
213 int qib_set_linkstate(struct qib_pportdata *ppd, u8 newstate)
214 {
215         u32 lstate;
216         int ret;
217         struct qib_devdata *dd = ppd->dd;
218         unsigned long flags;
219
220         switch (newstate) {
221         case QIB_IB_LINKDOWN_ONLY:
222                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
223                                  IB_LINKCMD_DOWN | IB_LINKINITCMD_NOP);
224                 /* don't wait */
225                 ret = 0;
226                 goto bail;
227
228         case QIB_IB_LINKDOWN:
229                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
230                                  IB_LINKCMD_DOWN | IB_LINKINITCMD_POLL);
231                 /* don't wait */
232                 ret = 0;
233                 goto bail;
234
235         case QIB_IB_LINKDOWN_SLEEP:
236                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
237                                  IB_LINKCMD_DOWN | IB_LINKINITCMD_SLEEP);
238                 /* don't wait */
239                 ret = 0;
240                 goto bail;
241
242         case QIB_IB_LINKDOWN_DISABLE:
243                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
244                                  IB_LINKCMD_DOWN | IB_LINKINITCMD_DISABLE);
245                 /* don't wait */
246                 ret = 0;
247                 goto bail;
248
249         case QIB_IB_LINKARM:
250                 if (ppd->lflags & QIBL_LINKARMED) {
251                         ret = 0;
252                         goto bail;
253                 }
254                 if (!(ppd->lflags & (QIBL_LINKINIT | QIBL_LINKACTIVE))) {
255                         ret = -EINVAL;
256                         goto bail;
257                 }
258                 /*
259                  * Since the port can be ACTIVE when we ask for ARMED,
260                  * clear QIBL_LINKV so we can wait for a transition.
261                  * If the link isn't ARMED, then something else happened
262                  * and there is no point waiting for ARMED.
263                  */
264                 spin_lock_irqsave(&ppd->lflags_lock, flags);
265                 ppd->lflags &= ~QIBL_LINKV;
266                 spin_unlock_irqrestore(&ppd->lflags_lock, flags);
267                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
268                                  IB_LINKCMD_ARMED | IB_LINKINITCMD_NOP);
269                 lstate = QIBL_LINKV;
270                 break;
271
272         case QIB_IB_LINKACTIVE:
273                 if (ppd->lflags & QIBL_LINKACTIVE) {
274                         ret = 0;
275                         goto bail;
276                 }
277                 if (!(ppd->lflags & QIBL_LINKARMED)) {
278                         ret = -EINVAL;
279                         goto bail;
280                 }
281                 dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
282                                  IB_LINKCMD_ACTIVE | IB_LINKINITCMD_NOP);
283                 lstate = QIBL_LINKACTIVE;
284                 break;
285
286         default:
287                 ret = -EINVAL;
288                 goto bail;
289         }
290         ret = qib_wait_linkstate(ppd, lstate, 10);
291
292 bail:
293         return ret;
294 }
295
296 /*
297  * Get address of eager buffer from it's index (allocated in chunks, not
298  * contiguous).
299  */
300 static inline void *qib_get_egrbuf(const struct qib_ctxtdata *rcd, u32 etail)
301 {
302         const u32 chunk = etail >> rcd->rcvegrbufs_perchunk_shift;
303         const u32 idx =  etail & ((u32)rcd->rcvegrbufs_perchunk - 1);
304
305         return rcd->rcvegrbuf[chunk] + (idx << rcd->dd->rcvegrbufsize_shift);
306 }
307
308 /*
309  * Returns 1 if error was a CRC, else 0.
310  * Needed for some chip's synthesized error counters.
311  */
312 static u32 qib_rcv_hdrerr(struct qib_ctxtdata *rcd, struct qib_pportdata *ppd,
313                           u32 ctxt, u32 eflags, u32 l, u32 etail,
314                           __le32 *rhf_addr, struct qib_message_header *rhdr)
315 {
316         u32 ret = 0;
317
318         if (eflags & (QLOGIC_IB_RHF_H_ICRCERR | QLOGIC_IB_RHF_H_VCRCERR))
319                 ret = 1;
320         else if (eflags == QLOGIC_IB_RHF_H_TIDERR) {
321                 /* For TIDERR and RC QPs premptively schedule a NAK */
322                 struct ib_header *hdr = (struct ib_header *)rhdr;
323                 struct ib_other_headers *ohdr = NULL;
324                 struct qib_ibport *ibp = &ppd->ibport_data;
325                 struct qib_devdata *dd = ppd->dd;
326                 struct rvt_dev_info *rdi = &dd->verbs_dev.rdi;
327                 struct rvt_qp *qp = NULL;
328                 u32 tlen = qib_hdrget_length_in_bytes(rhf_addr);
329                 u16 lid  = be16_to_cpu(hdr->lrh[1]);
330                 int lnh = be16_to_cpu(hdr->lrh[0]) & 3;
331                 u32 qp_num;
332                 u32 opcode;
333                 u32 psn;
334                 int diff;
335
336                 /* Sanity check packet */
337                 if (tlen < 24)
338                         goto drop;
339
340                 if (lid < be16_to_cpu(IB_MULTICAST_LID_BASE)) {
341                         lid &= ~((1 << ppd->lmc) - 1);
342                         if (unlikely(lid != ppd->lid))
343                                 goto drop;
344                 }
345
346                 /* Check for GRH */
347                 if (lnh == QIB_LRH_BTH)
348                         ohdr = &hdr->u.oth;
349                 else if (lnh == QIB_LRH_GRH) {
350                         u32 vtf;
351
352                         ohdr = &hdr->u.l.oth;
353                         if (hdr->u.l.grh.next_hdr != IB_GRH_NEXT_HDR)
354                                 goto drop;
355                         vtf = be32_to_cpu(hdr->u.l.grh.version_tclass_flow);
356                         if ((vtf >> IB_GRH_VERSION_SHIFT) != IB_GRH_VERSION)
357                                 goto drop;
358                 } else
359                         goto drop;
360
361                 /* Get opcode and PSN from packet */
362                 opcode = be32_to_cpu(ohdr->bth[0]);
363                 opcode >>= 24;
364                 psn = be32_to_cpu(ohdr->bth[2]);
365
366                 /* Get the destination QP number. */
367                 qp_num = be32_to_cpu(ohdr->bth[1]) & RVT_QPN_MASK;
368                 if (qp_num != QIB_MULTICAST_QPN) {
369                         int ruc_res;
370
371                         rcu_read_lock();
372                         qp = rvt_lookup_qpn(rdi, &ibp->rvp, qp_num);
373                         if (!qp) {
374                                 rcu_read_unlock();
375                                 goto drop;
376                         }
377
378                         /*
379                          * Handle only RC QPs - for other QP types drop error
380                          * packet.
381                          */
382                         spin_lock(&qp->r_lock);
383
384                         /* Check for valid receive state. */
385                         if (!(ib_rvt_state_ops[qp->state] &
386                               RVT_PROCESS_RECV_OK)) {
387                                 ibp->rvp.n_pkt_drops++;
388                                 goto unlock;
389                         }
390
391                         switch (qp->ibqp.qp_type) {
392                         case IB_QPT_RC:
393                                 ruc_res =
394                                         qib_ruc_check_hdr(
395                                                 ibp, hdr,
396                                                 lnh == QIB_LRH_GRH,
397                                                 qp,
398                                                 be32_to_cpu(ohdr->bth[0]));
399                                 if (ruc_res)
400                                         goto unlock;
401
402                                 /* Only deal with RDMA Writes for now */
403                                 if (opcode <
404                                     IB_OPCODE_RC_RDMA_READ_RESPONSE_FIRST) {
405                                         diff = qib_cmp24(psn, qp->r_psn);
406                                         if (!qp->r_nak_state && diff >= 0) {
407                                                 ibp->rvp.n_rc_seqnak++;
408                                                 qp->r_nak_state =
409                                                         IB_NAK_PSN_ERROR;
410                                                 /* Use the expected PSN. */
411                                                 qp->r_ack_psn = qp->r_psn;
412                                                 /*
413                                                  * Wait to send the sequence
414                                                  * NAK until all packets
415                                                  * in the receive queue have
416                                                  * been processed.
417                                                  * Otherwise, we end up
418                                                  * propagating congestion.
419                                                  */
420                                                 if (list_empty(&qp->rspwait)) {
421                                                         qp->r_flags |=
422                                                                 RVT_R_RSP_NAK;
423                                                         atomic_inc(
424                                                                 &qp->refcount);
425                                                         list_add_tail(
426                                                          &qp->rspwait,
427                                                          &rcd->qp_wait_list);
428                                                 }
429                                         } /* Out of sequence NAK */
430                                 } /* QP Request NAKs */
431                                 break;
432                         case IB_QPT_SMI:
433                         case IB_QPT_GSI:
434                         case IB_QPT_UD:
435                         case IB_QPT_UC:
436                         default:
437                                 /* For now don't handle any other QP types */
438                                 break;
439                         }
440
441 unlock:
442                         spin_unlock(&qp->r_lock);
443                         rcu_read_unlock();
444                 } /* Unicast QP */
445         } /* Valid packet with TIDErr */
446
447 drop:
448         return ret;
449 }
450
451 /*
452  * qib_kreceive - receive a packet
453  * @rcd: the qlogic_ib context
454  * @llic: gets count of good packets needed to clear lli,
455  *          (used with chips that need need to track crcs for lli)
456  *
457  * called from interrupt handler for errors or receive interrupt
458  * Returns number of CRC error packets, needed by some chips for
459  * local link integrity tracking.   crcs are adjusted down by following
460  * good packets, if any, and count of good packets is also tracked.
461  */
462 u32 qib_kreceive(struct qib_ctxtdata *rcd, u32 *llic, u32 *npkts)
463 {
464         struct qib_devdata *dd = rcd->dd;
465         struct qib_pportdata *ppd = rcd->ppd;
466         __le32 *rhf_addr;
467         void *ebuf;
468         const u32 rsize = dd->rcvhdrentsize;        /* words */
469         const u32 maxcnt = dd->rcvhdrcnt * rsize;   /* words */
470         u32 etail = -1, l, hdrqtail;
471         struct qib_message_header *hdr;
472         u32 eflags, etype, tlen, i = 0, updegr = 0, crcs = 0;
473         int last;
474         u64 lval;
475         struct rvt_qp *qp, *nqp;
476
477         l = rcd->head;
478         rhf_addr = (__le32 *) rcd->rcvhdrq + l + dd->rhf_offset;
479         if (dd->flags & QIB_NODMA_RTAIL) {
480                 u32 seq = qib_hdrget_seq(rhf_addr);
481
482                 if (seq != rcd->seq_cnt)
483                         goto bail;
484                 hdrqtail = 0;
485         } else {
486                 hdrqtail = qib_get_rcvhdrtail(rcd);
487                 if (l == hdrqtail)
488                         goto bail;
489                 smp_rmb();  /* prevent speculative reads of dma'ed hdrq */
490         }
491
492         for (last = 0, i = 1; !last; i += !last) {
493                 hdr = dd->f_get_msgheader(dd, rhf_addr);
494                 eflags = qib_hdrget_err_flags(rhf_addr);
495                 etype = qib_hdrget_rcv_type(rhf_addr);
496                 /* total length */
497                 tlen = qib_hdrget_length_in_bytes(rhf_addr);
498                 ebuf = NULL;
499                 if ((dd->flags & QIB_NODMA_RTAIL) ?
500                     qib_hdrget_use_egr_buf(rhf_addr) :
501                     (etype != RCVHQ_RCV_TYPE_EXPECTED)) {
502                         etail = qib_hdrget_index(rhf_addr);
503                         updegr = 1;
504                         if (tlen > sizeof(*hdr) ||
505                             etype >= RCVHQ_RCV_TYPE_NON_KD) {
506                                 ebuf = qib_get_egrbuf(rcd, etail);
507                                 prefetch_range(ebuf, tlen - sizeof(*hdr));
508                         }
509                 }
510                 if (!eflags) {
511                         u16 lrh_len = be16_to_cpu(hdr->lrh[2]) << 2;
512
513                         if (lrh_len != tlen) {
514                                 qib_stats.sps_lenerrs++;
515                                 goto move_along;
516                         }
517                 }
518                 if (etype == RCVHQ_RCV_TYPE_NON_KD && !eflags &&
519                     ebuf == NULL &&
520                     tlen > (dd->rcvhdrentsize - 2 + 1 -
521                                 qib_hdrget_offset(rhf_addr)) << 2) {
522                         goto move_along;
523                 }
524
525                 /*
526                  * Both tiderr and qibhdrerr are set for all plain IB
527                  * packets; only qibhdrerr should be set.
528                  */
529                 if (unlikely(eflags))
530                         crcs += qib_rcv_hdrerr(rcd, ppd, rcd->ctxt, eflags, l,
531                                                etail, rhf_addr, hdr);
532                 else if (etype == RCVHQ_RCV_TYPE_NON_KD) {
533                         qib_ib_rcv(rcd, hdr, ebuf, tlen);
534                         if (crcs)
535                                 crcs--;
536                         else if (llic && *llic)
537                                 --*llic;
538                 }
539 move_along:
540                 l += rsize;
541                 if (l >= maxcnt)
542                         l = 0;
543                 if (i == QIB_MAX_PKT_RECV)
544                         last = 1;
545
546                 rhf_addr = (__le32 *) rcd->rcvhdrq + l + dd->rhf_offset;
547                 if (dd->flags & QIB_NODMA_RTAIL) {
548                         u32 seq = qib_hdrget_seq(rhf_addr);
549
550                         if (++rcd->seq_cnt > 13)
551                                 rcd->seq_cnt = 1;
552                         if (seq != rcd->seq_cnt)
553                                 last = 1;
554                 } else if (l == hdrqtail)
555                         last = 1;
556                 /*
557                  * Update head regs etc., every 16 packets, if not last pkt,
558                  * to help prevent rcvhdrq overflows, when many packets
559                  * are processed and queue is nearly full.
560                  * Don't request an interrupt for intermediate updates.
561                  */
562                 lval = l;
563                 if (!last && !(i & 0xf)) {
564                         dd->f_update_usrhead(rcd, lval, updegr, etail, i);
565                         updegr = 0;
566                 }
567         }
568
569         rcd->head = l;
570
571         /*
572          * Iterate over all QPs waiting to respond.
573          * The list won't change since the IRQ is only run on one CPU.
574          */
575         list_for_each_entry_safe(qp, nqp, &rcd->qp_wait_list, rspwait) {
576                 list_del_init(&qp->rspwait);
577                 if (qp->r_flags & RVT_R_RSP_NAK) {
578                         qp->r_flags &= ~RVT_R_RSP_NAK;
579                         qib_send_rc_ack(qp);
580                 }
581                 if (qp->r_flags & RVT_R_RSP_SEND) {
582                         unsigned long flags;
583
584                         qp->r_flags &= ~RVT_R_RSP_SEND;
585                         spin_lock_irqsave(&qp->s_lock, flags);
586                         if (ib_rvt_state_ops[qp->state] &
587                                         RVT_PROCESS_OR_FLUSH_SEND)
588                                 qib_schedule_send(qp);
589                         spin_unlock_irqrestore(&qp->s_lock, flags);
590                 }
591                 rvt_put_qp(qp);
592         }
593
594 bail:
595         /* Report number of packets consumed */
596         if (npkts)
597                 *npkts = i;
598
599         /*
600          * Always write head at end, and setup rcv interrupt, even
601          * if no packets were processed.
602          */
603         lval = (u64)rcd->head | dd->rhdrhead_intr_off;
604         dd->f_update_usrhead(rcd, lval, updegr, etail, i);
605         return crcs;
606 }
607
608 /**
609  * qib_set_mtu - set the MTU
610  * @ppd: the perport data
611  * @arg: the new MTU
612  *
613  * We can handle "any" incoming size, the issue here is whether we
614  * need to restrict our outgoing size.   For now, we don't do any
615  * sanity checking on this, and we don't deal with what happens to
616  * programs that are already running when the size changes.
617  * NOTE: changing the MTU will usually cause the IBC to go back to
618  * link INIT state...
619  */
620 int qib_set_mtu(struct qib_pportdata *ppd, u16 arg)
621 {
622         u32 piosize;
623         int ret, chk;
624
625         if (arg != 256 && arg != 512 && arg != 1024 && arg != 2048 &&
626             arg != 4096) {
627                 ret = -EINVAL;
628                 goto bail;
629         }
630         chk = ib_mtu_enum_to_int(qib_ibmtu);
631         if (chk > 0 && arg > chk) {
632                 ret = -EINVAL;
633                 goto bail;
634         }
635
636         piosize = ppd->ibmaxlen;
637         ppd->ibmtu = arg;
638
639         if (arg >= (piosize - QIB_PIO_MAXIBHDR)) {
640                 /* Only if it's not the initial value (or reset to it) */
641                 if (piosize != ppd->init_ibmaxlen) {
642                         if (arg > piosize && arg <= ppd->init_ibmaxlen)
643                                 piosize = ppd->init_ibmaxlen - 2 * sizeof(u32);
644                         ppd->ibmaxlen = piosize;
645                 }
646         } else if ((arg + QIB_PIO_MAXIBHDR) != ppd->ibmaxlen) {
647                 piosize = arg + QIB_PIO_MAXIBHDR - 2 * sizeof(u32);
648                 ppd->ibmaxlen = piosize;
649         }
650
651         ppd->dd->f_set_ib_cfg(ppd, QIB_IB_CFG_MTU, 0);
652
653         ret = 0;
654
655 bail:
656         return ret;
657 }
658
659 int qib_set_lid(struct qib_pportdata *ppd, u32 lid, u8 lmc)
660 {
661         struct qib_devdata *dd = ppd->dd;
662
663         ppd->lid = lid;
664         ppd->lmc = lmc;
665
666         dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LIDLMC,
667                          lid | (~((1U << lmc) - 1)) << 16);
668
669         qib_devinfo(dd->pcidev, "IB%u:%u got a lid: 0x%x\n",
670                     dd->unit, ppd->port, lid);
671
672         return 0;
673 }
674
675 /*
676  * Following deal with the "obviously simple" task of overriding the state
677  * of the LEDS, which normally indicate link physical and logical status.
678  * The complications arise in dealing with different hardware mappings
679  * and the board-dependent routine being called from interrupts.
680  * and then there's the requirement to _flash_ them.
681  */
682 #define LED_OVER_FREQ_SHIFT 8
683 #define LED_OVER_FREQ_MASK (0xFF<<LED_OVER_FREQ_SHIFT)
684 /* Below is "non-zero" to force override, but both actual LEDs are off */
685 #define LED_OVER_BOTH_OFF (8)
686
687 static void qib_run_led_override(unsigned long opaque)
688 {
689         struct qib_pportdata *ppd = (struct qib_pportdata *)opaque;
690         struct qib_devdata *dd = ppd->dd;
691         int timeoff;
692         int ph_idx;
693
694         if (!(dd->flags & QIB_INITTED))
695                 return;
696
697         ph_idx = ppd->led_override_phase++ & 1;
698         ppd->led_override = ppd->led_override_vals[ph_idx];
699         timeoff = ppd->led_override_timeoff;
700
701         dd->f_setextled(ppd, 1);
702         /*
703          * don't re-fire the timer if user asked for it to be off; we let
704          * it fire one more time after they turn it off to simplify
705          */
706         if (ppd->led_override_vals[0] || ppd->led_override_vals[1])
707                 mod_timer(&ppd->led_override_timer, jiffies + timeoff);
708 }
709
710 void qib_set_led_override(struct qib_pportdata *ppd, unsigned int val)
711 {
712         struct qib_devdata *dd = ppd->dd;
713         int timeoff, freq;
714
715         if (!(dd->flags & QIB_INITTED))
716                 return;
717
718         /* First check if we are blinking. If not, use 1HZ polling */
719         timeoff = HZ;
720         freq = (val & LED_OVER_FREQ_MASK) >> LED_OVER_FREQ_SHIFT;
721
722         if (freq) {
723                 /* For blink, set each phase from one nybble of val */
724                 ppd->led_override_vals[0] = val & 0xF;
725                 ppd->led_override_vals[1] = (val >> 4) & 0xF;
726                 timeoff = (HZ << 4)/freq;
727         } else {
728                 /* Non-blink set both phases the same. */
729                 ppd->led_override_vals[0] = val & 0xF;
730                 ppd->led_override_vals[1] = val & 0xF;
731         }
732         ppd->led_override_timeoff = timeoff;
733
734         /*
735          * If the timer has not already been started, do so. Use a "quick"
736          * timeout so the function will be called soon, to look at our request.
737          */
738         if (atomic_inc_return(&ppd->led_override_timer_active) == 1) {
739                 /* Need to start timer */
740                 init_timer(&ppd->led_override_timer);
741                 ppd->led_override_timer.function = qib_run_led_override;
742                 ppd->led_override_timer.data = (unsigned long) ppd;
743                 ppd->led_override_timer.expires = jiffies + 1;
744                 add_timer(&ppd->led_override_timer);
745         } else {
746                 if (ppd->led_override_vals[0] || ppd->led_override_vals[1])
747                         mod_timer(&ppd->led_override_timer, jiffies + 1);
748                 atomic_dec(&ppd->led_override_timer_active);
749         }
750 }
751
752 /**
753  * qib_reset_device - reset the chip if possible
754  * @unit: the device to reset
755  *
756  * Whether or not reset is successful, we attempt to re-initialize the chip
757  * (that is, much like a driver unload/reload).  We clear the INITTED flag
758  * so that the various entry points will fail until we reinitialize.  For
759  * now, we only allow this if no user contexts are open that use chip resources
760  */
761 int qib_reset_device(int unit)
762 {
763         int ret, i;
764         struct qib_devdata *dd = qib_lookup(unit);
765         struct qib_pportdata *ppd;
766         unsigned long flags;
767         int pidx;
768
769         if (!dd) {
770                 ret = -ENODEV;
771                 goto bail;
772         }
773
774         qib_devinfo(dd->pcidev, "Reset on unit %u requested\n", unit);
775
776         if (!dd->kregbase || !(dd->flags & QIB_PRESENT)) {
777                 qib_devinfo(dd->pcidev,
778                         "Invalid unit number %u or not initialized or not present\n",
779                         unit);
780                 ret = -ENXIO;
781                 goto bail;
782         }
783
784         spin_lock_irqsave(&dd->uctxt_lock, flags);
785         if (dd->rcd)
786                 for (i = dd->first_user_ctxt; i < dd->cfgctxts; i++) {
787                         if (!dd->rcd[i] || !dd->rcd[i]->cnt)
788                                 continue;
789                         spin_unlock_irqrestore(&dd->uctxt_lock, flags);
790                         ret = -EBUSY;
791                         goto bail;
792                 }
793         spin_unlock_irqrestore(&dd->uctxt_lock, flags);
794
795         for (pidx = 0; pidx < dd->num_pports; ++pidx) {
796                 ppd = dd->pport + pidx;
797                 if (atomic_read(&ppd->led_override_timer_active)) {
798                         /* Need to stop LED timer, _then_ shut off LEDs */
799                         del_timer_sync(&ppd->led_override_timer);
800                         atomic_set(&ppd->led_override_timer_active, 0);
801                 }
802
803                 /* Shut off LEDs after we are sure timer is not running */
804                 ppd->led_override = LED_OVER_BOTH_OFF;
805                 dd->f_setextled(ppd, 0);
806                 if (dd->flags & QIB_HAS_SEND_DMA)
807                         qib_teardown_sdma(ppd);
808         }
809
810         ret = dd->f_reset(dd);
811         if (ret == 1)
812                 ret = qib_init(dd, 1);
813         else
814                 ret = -EAGAIN;
815         if (ret)
816                 qib_dev_err(dd,
817                         "Reinitialize unit %u after reset failed with %d\n",
818                         unit, ret);
819         else
820                 qib_devinfo(dd->pcidev,
821                         "Reinitialized unit %u after resetting\n",
822                         unit);
823
824 bail:
825         return ret;
826 }