1/*
2 * cxgb3i_offload.c: Chelsio S3xx iscsi offloaded tcp connection management
3 *
4 * Copyright (C) 2003-2008 Chelsio Communications.  All rights reserved.
5 *
6 * This program is distributed in the hope that it will be useful, but WITHOUT
7 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
8 * FITNESS FOR A PARTICULAR PURPOSE.  See the LICENSE file included in this
9 * release for licensing terms and conditions.
10 *
11 * Written by:	Dimitris Michailidis (dm@chelsio.com)
12 *		Karen Xie (kxie@chelsio.com)
13 */
14
15#define pr_fmt(fmt) KBUILD_MODNAME ":%s: " fmt, __func__
16
17#include <linux/module.h>
18#include <linux/moduleparam.h>
19#include <scsi/scsi_host.h>
20
21#include "common.h"
22#include "t3_cpl.h"
23#include "t3cdev.h"
24#include "cxgb3_defs.h"
25#include "cxgb3_ctl_defs.h"
26#include "cxgb3_offload.h"
27#include "firmware_exports.h"
28#include "cxgb3i.h"
29
30static unsigned int dbg_level;
31#include "../libcxgbi.h"
32
33#define DRV_MODULE_NAME         "cxgb3i"
34#define DRV_MODULE_DESC         "Chelsio T3 iSCSI Driver"
35#define DRV_MODULE_VERSION	"2.0.0"
36#define DRV_MODULE_RELDATE	"Jun. 2010"
37
38static char version[] =
39	DRV_MODULE_DESC " " DRV_MODULE_NAME
40	" v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
41
42MODULE_AUTHOR("Chelsio Communications, Inc.");
43MODULE_DESCRIPTION(DRV_MODULE_DESC);
44MODULE_VERSION(DRV_MODULE_VERSION);
45MODULE_LICENSE("GPL");
46
47module_param(dbg_level, uint, 0644);
48MODULE_PARM_DESC(dbg_level, "debug flag (default=0)");
49
50static int cxgb3i_rcv_win = 256 * 1024;
51module_param(cxgb3i_rcv_win, int, 0644);
52MODULE_PARM_DESC(cxgb3i_rcv_win, "TCP receive window in bytes (default=256KB)");
53
54static int cxgb3i_snd_win = 128 * 1024;
55module_param(cxgb3i_snd_win, int, 0644);
56MODULE_PARM_DESC(cxgb3i_snd_win, "TCP send window in bytes (default=128KB)");
57
58static int cxgb3i_rx_credit_thres = 10 * 1024;
59module_param(cxgb3i_rx_credit_thres, int, 0644);
60MODULE_PARM_DESC(rx_credit_thres,
61		 "RX credits return threshold in bytes (default=10KB)");
62
63static unsigned int cxgb3i_max_connect = 8 * 1024;
64module_param(cxgb3i_max_connect, uint, 0644);
65MODULE_PARM_DESC(cxgb3i_max_connect, "Max. # of connections (default=8092)");
66
67static unsigned int cxgb3i_sport_base = 20000;
68module_param(cxgb3i_sport_base, uint, 0644);
69MODULE_PARM_DESC(cxgb3i_sport_base, "starting port number (default=20000)");
70
71static void cxgb3i_dev_open(struct t3cdev *);
72static void cxgb3i_dev_close(struct t3cdev *);
73static void cxgb3i_dev_event_handler(struct t3cdev *, u32, u32);
74
75static struct cxgb3_client t3_client = {
76	.name = DRV_MODULE_NAME,
77	.handlers = cxgb3i_cpl_handlers,
78	.add = cxgb3i_dev_open,
79	.remove = cxgb3i_dev_close,
80	.event_handler = cxgb3i_dev_event_handler,
81};
82
83static struct scsi_host_template cxgb3i_host_template = {
84	.module		= THIS_MODULE,
85	.name		= DRV_MODULE_NAME,
86	.proc_name	= DRV_MODULE_NAME,
87	.can_queue	= CXGB3I_SCSI_HOST_QDEPTH,
88	.queuecommand	= iscsi_queuecommand,
89	.change_queue_depth = scsi_change_queue_depth,
90	.sg_tablesize	= SG_ALL,
91	.max_sectors	= 0xFFFF,
92	.cmd_per_lun	= ISCSI_DEF_CMD_PER_LUN,
93	.eh_abort_handler = iscsi_eh_abort,
94	.eh_device_reset_handler = iscsi_eh_device_reset,
95	.eh_target_reset_handler = iscsi_eh_recover_target,
96	.target_alloc	= iscsi_target_alloc,
97	.use_clustering	= DISABLE_CLUSTERING,
98	.this_id	= -1,
99	.track_queue_depth = 1,
100};
101
102static struct iscsi_transport cxgb3i_iscsi_transport = {
103	.owner		= THIS_MODULE,
104	.name		= DRV_MODULE_NAME,
105	/* owner and name should be set already */
106	.caps		= CAP_RECOVERY_L0 | CAP_MULTI_R2T | CAP_HDRDGST
107				| CAP_DATADGST | CAP_DIGEST_OFFLOAD |
108				CAP_PADDING_OFFLOAD | CAP_TEXT_NEGO,
109	.attr_is_visible	= cxgbi_attr_is_visible,
110	.get_host_param	= cxgbi_get_host_param,
111	.set_host_param	= cxgbi_set_host_param,
112	/* session management */
113	.create_session	= cxgbi_create_session,
114	.destroy_session	= cxgbi_destroy_session,
115	.get_session_param = iscsi_session_get_param,
116	/* connection management */
117	.create_conn	= cxgbi_create_conn,
118	.bind_conn	= cxgbi_bind_conn,
119	.destroy_conn	= iscsi_tcp_conn_teardown,
120	.start_conn	= iscsi_conn_start,
121	.stop_conn	= iscsi_conn_stop,
122	.get_conn_param	= iscsi_conn_get_param,
123	.set_param	= cxgbi_set_conn_param,
124	.get_stats	= cxgbi_get_conn_stats,
125	/* pdu xmit req from user space */
126	.send_pdu	= iscsi_conn_send_pdu,
127	/* task */
128	.init_task	= iscsi_tcp_task_init,
129	.xmit_task	= iscsi_tcp_task_xmit,
130	.cleanup_task	= cxgbi_cleanup_task,
131	/* pdu */
132	.alloc_pdu	= cxgbi_conn_alloc_pdu,
133	.init_pdu	= cxgbi_conn_init_pdu,
134	.xmit_pdu	= cxgbi_conn_xmit_pdu,
135	.parse_pdu_itt	= cxgbi_parse_pdu_itt,
136	/* TCP connect/disconnect */
137	.get_ep_param	= cxgbi_get_ep_param,
138	.ep_connect	= cxgbi_ep_connect,
139	.ep_poll	= cxgbi_ep_poll,
140	.ep_disconnect	= cxgbi_ep_disconnect,
141	/* Error recovery timeout call */
142	.session_recovery_timedout = iscsi_session_recovery_timedout,
143};
144
145static struct scsi_transport_template *cxgb3i_stt;
146
/*
 * CPL (Chelsio Protocol Language) defines a message passing interface between
 * the host driver and the Chelsio ASIC.
 * The section below implements the CPLs related to iscsi tcp connection
 * open/close/abort and data send/receive.
 */
153
154static int push_tx_frames(struct cxgbi_sock *csk, int req_completion);
155
156static void send_act_open_req(struct cxgbi_sock *csk, struct sk_buff *skb,
157			      const struct l2t_entry *e)
158{
159	unsigned int wscale = cxgbi_sock_compute_wscale(cxgb3i_rcv_win);
160	struct cpl_act_open_req *req = (struct cpl_act_open_req *)skb->head;
161
162	skb->priority = CPL_PRIORITY_SETUP;
163
164	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
165	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_ACT_OPEN_REQ, csk->atid));
166	req->local_port = csk->saddr.sin_port;
167	req->peer_port = csk->daddr.sin_port;
168	req->local_ip = csk->saddr.sin_addr.s_addr;
169	req->peer_ip = csk->daddr.sin_addr.s_addr;
170
171	req->opt0h = htonl(V_KEEP_ALIVE(1) | F_TCAM_BYPASS |
172			V_WND_SCALE(wscale) | V_MSS_IDX(csk->mss_idx) |
173			V_L2T_IDX(e->idx) | V_TX_CHANNEL(e->smt_idx));
174	req->opt0l = htonl(V_ULP_MODE(ULP2_MODE_ISCSI) |
175			V_RCV_BUFSIZ(cxgb3i_rcv_win>>10));
176
177	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
178		"csk 0x%p,%u,0x%lx,%u, %pI4:%u-%pI4:%u, %u,%u,%u.\n",
179		csk, csk->state, csk->flags, csk->atid,
180		&req->local_ip, ntohs(req->local_port),
181		&req->peer_ip, ntohs(req->peer_port),
182		csk->mss_idx, e->idx, e->smt_idx);
183
184	l2t_send(csk->cdev->lldev, skb, csk->l2t);
185}
186
187static inline void act_open_arp_failure(struct t3cdev *dev, struct sk_buff *skb)
188{
189	cxgbi_sock_act_open_req_arp_failure(NULL, skb);
190}
191
/*
 * CPL connection close request: host ->
 *
 * Close a connection by sending a CPL_CLOSE_CON_REQ message and queue it to
 * the write queue (i.e., after any unsent tx data).
 */
198static void send_close_req(struct cxgbi_sock *csk)
199{
200	struct sk_buff *skb = csk->cpl_close;
201	struct cpl_close_con_req *req = (struct cpl_close_con_req *)skb->head;
202	unsigned int tid = csk->tid;
203
204	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
205		"csk 0x%p,%u,0x%lx,%u.\n",
206		csk, csk->state, csk->flags, csk->tid);
207
208	csk->cpl_close = NULL;
209	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_OFLD_CLOSE_CON));
210	req->wr.wr_lo = htonl(V_WR_TID(tid));
211	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_CLOSE_CON_REQ, tid));
212	req->rsvd = htonl(csk->write_seq);
213
214	cxgbi_sock_skb_entail(csk, skb);
215	if (csk->state >= CTP_ESTABLISHED)
216		push_tx_frames(csk, 1);
217}
218
219/*
220 * CPL connection abort request: host ->
221 *
222 * Send an ABORT_REQ message. Makes sure we do not send multiple ABORT_REQs
223 * for the same connection and also that we do not try to send a message
224 * after the connection has closed.
225 */
226static void abort_arp_failure(struct t3cdev *tdev, struct sk_buff *skb)
227{
228	struct cpl_abort_req *req = cplhdr(skb);
229
230	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
231		"t3dev 0x%p, tid %u, skb 0x%p.\n",
232		tdev, GET_TID(req), skb);
233	req->cmd = CPL_ABORT_NO_RST;
234	cxgb3_ofld_send(tdev, skb);
235}
236
237static void send_abort_req(struct cxgbi_sock *csk)
238{
239	struct sk_buff *skb = csk->cpl_abort_req;
240	struct cpl_abort_req *req;
241
242	if (unlikely(csk->state == CTP_ABORTING || !skb))
243		return;
244	cxgbi_sock_set_state(csk, CTP_ABORTING);
245	cxgbi_sock_set_flag(csk, CTPF_ABORT_RPL_PENDING);
246	/* Purge the send queue so we don't send anything after an abort. */
247	cxgbi_sock_purge_write_queue(csk);
248
249	csk->cpl_abort_req = NULL;
250	req = (struct cpl_abort_req *)skb->head;
251	skb->priority = CPL_PRIORITY_DATA;
252	set_arp_failure_handler(skb, abort_arp_failure);
253	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_OFLD_HOST_ABORT_CON_REQ));
254	req->wr.wr_lo = htonl(V_WR_TID(csk->tid));
255	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_ABORT_REQ, csk->tid));
256	req->rsvd0 = htonl(csk->snd_nxt);
257	req->rsvd1 = !cxgbi_sock_flag(csk, CTPF_TX_DATA_SENT);
258	req->cmd = CPL_ABORT_SEND_RST;
259
260	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
261		"csk 0x%p,%u,0x%lx,%u, snd_nxt %u, 0x%x.\n",
262		csk, csk->state, csk->flags, csk->tid, csk->snd_nxt,
263		req->rsvd1);
264
265	l2t_send(csk->cdev->lldev, skb, csk->l2t);
266}
267
268/*
269 * CPL connection abort reply: host ->
270 *
271 * Send an ABORT_RPL message in response of the ABORT_REQ received.
272 */
273static void send_abort_rpl(struct cxgbi_sock *csk, int rst_status)
274{
275	struct sk_buff *skb = csk->cpl_abort_rpl;
276	struct cpl_abort_rpl *rpl = (struct cpl_abort_rpl *)skb->head;
277
278	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
279		"csk 0x%p,%u,0x%lx,%u, status %d.\n",
280		csk, csk->state, csk->flags, csk->tid, rst_status);
281
282	csk->cpl_abort_rpl = NULL;
283	skb->priority = CPL_PRIORITY_DATA;
284	rpl->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_OFLD_HOST_ABORT_CON_RPL));
285	rpl->wr.wr_lo = htonl(V_WR_TID(csk->tid));
286	OPCODE_TID(rpl) = htonl(MK_OPCODE_TID(CPL_ABORT_RPL, csk->tid));
287	rpl->cmd = rst_status;
288	cxgb3_ofld_send(csk->cdev->lldev, skb);
289}
290
291/*
292 * CPL connection rx data ack: host ->
293 * Send RX credits through an RX_DATA_ACK CPL message. Returns the number of
294 * credits sent.
295 */
296static u32 send_rx_credits(struct cxgbi_sock *csk, u32 credits)
297{
298	struct sk_buff *skb;
299	struct cpl_rx_data_ack *req;
300	u32 dack = F_RX_DACK_CHANGE | V_RX_DACK_MODE(1);
301
302	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_RX,
303		"csk 0x%p,%u,0x%lx,%u, credit %u, dack %u.\n",
304		csk, csk->state, csk->flags, csk->tid, credits, dack);
305
306	skb = alloc_wr(sizeof(*req), 0, GFP_ATOMIC);
307	if (!skb) {
308		pr_info("csk 0x%p, credit %u, OOM.\n", csk, credits);
309		return 0;
310	}
311	req = (struct cpl_rx_data_ack *)skb->head;
312	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
313	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_RX_DATA_ACK, csk->tid));
314	req->credit_dack = htonl(F_RX_DACK_CHANGE | V_RX_DACK_MODE(1) |
315				V_RX_CREDITS(credits));
316	skb->priority = CPL_PRIORITY_ACK;
317	cxgb3_ofld_send(csk->cdev->lldev, skb);
318	return credits;
319}
320
/*
 * CPL connection tx data: host ->
 *
 * Send iscsi PDU via TX_DATA CPL message. Returns the number of
 * credits sent.
 * Each TX_DATA consumes work request credit (wrs), so we need to keep track of
 * how many we've used so far and how many are pending (i.e., not yet ack'ed
 * by T3).
 */
329
330static unsigned int wrlen __read_mostly;
331static unsigned int skb_wrs[SKB_WR_LIST_SIZE] __read_mostly;
332
333static void init_wr_tab(unsigned int wr_len)
334{
335	int i;
336
337	if (skb_wrs[1])		/* already initialized */
338		return;
339	for (i = 1; i < SKB_WR_LIST_SIZE; i++) {
340		int sgl_len = (3 * i) / 2 + (i & 1);
341
342		sgl_len += 3;
343		skb_wrs[i] = (sgl_len <= wr_len
344			      ? 1 : 1 + (sgl_len - 2) / (wr_len - 1));
345	}
346	wrlen = wr_len * 8;
347}
348
349static inline void make_tx_data_wr(struct cxgbi_sock *csk, struct sk_buff *skb,
350				   int len, int req_completion)
351{
352	struct tx_data_wr *req;
353	struct l2t_entry *l2t = csk->l2t;
354
355	skb_reset_transport_header(skb);
356	req = (struct tx_data_wr *)__skb_push(skb, sizeof(*req));
357	req->wr_hi = htonl(V_WR_OP(FW_WROPCODE_OFLD_TX_DATA) |
358			(req_completion ? F_WR_COMPL : 0));
359	req->wr_lo = htonl(V_WR_TID(csk->tid));
360	/* len includes the length of any HW ULP additions */
361	req->len = htonl(len);
362	/* V_TX_ULP_SUBMODE sets both the mode and submode */
363	req->flags = htonl(V_TX_ULP_SUBMODE(cxgbi_skcb_ulp_mode(skb)) |
364			   V_TX_SHOVE((skb_peek(&csk->write_queue) ? 0 : 1)));
365	req->sndseq = htonl(csk->snd_nxt);
366	req->param = htonl(V_TX_PORT(l2t->smt_idx));
367
368	if (!cxgbi_sock_flag(csk, CTPF_TX_DATA_SENT)) {
369		req->flags |= htonl(V_TX_ACK_PAGES(2) | F_TX_INIT |
370				    V_TX_CPU_IDX(csk->rss_qid));
371		/* sendbuffer is in units of 32KB. */
372		req->param |= htonl(V_TX_SNDBUF(cxgb3i_snd_win >> 15));
373		cxgbi_sock_set_flag(csk, CTPF_TX_DATA_SENT);
374	}
375}
376
377/**
378 * push_tx_frames -- start transmit
379 * @c3cn: the offloaded connection
380 * @req_completion: request wr_ack or not
381 *
382 * Prepends TX_DATA_WR or CPL_CLOSE_CON_REQ headers to buffers waiting in a
383 * connection's send queue and sends them on to T3.  Must be called with the
384 * connection's lock held.  Returns the amount of send buffer space that was
385 * freed as a result of sending queued data to T3.
386 */
387
388static void arp_failure_skb_discard(struct t3cdev *dev, struct sk_buff *skb)
389{
390	kfree_skb(skb);
391}
392
393static int push_tx_frames(struct cxgbi_sock *csk, int req_completion)
394{
395	int total_size = 0;
396	struct sk_buff *skb;
397
398	if (unlikely(csk->state < CTP_ESTABLISHED ||
399		csk->state == CTP_CLOSE_WAIT_1 || csk->state >= CTP_ABORTING)) {
400			log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_TX,
401				"csk 0x%p,%u,0x%lx,%u, in closing state.\n",
402				csk, csk->state, csk->flags, csk->tid);
403		return 0;
404	}
405
406	while (csk->wr_cred && (skb = skb_peek(&csk->write_queue)) != NULL) {
407		int len = skb->len;	/* length before skb_push */
408		int frags = skb_shinfo(skb)->nr_frags + (len != skb->data_len);
409		int wrs_needed = skb_wrs[frags];
410
411		if (wrs_needed > 1 && len + sizeof(struct tx_data_wr) <= wrlen)
412			wrs_needed = 1;
413
414		WARN_ON(frags >= SKB_WR_LIST_SIZE || wrs_needed < 1);
415
416		if (csk->wr_cred < wrs_needed) {
417			log_debug(1 << CXGBI_DBG_PDU_TX,
418				"csk 0x%p, skb len %u/%u, frag %u, wr %d<%u.\n",
419				csk, skb->len, skb->data_len, frags,
420				wrs_needed, csk->wr_cred);
421			break;
422		}
423
424		__skb_unlink(skb, &csk->write_queue);
425		skb->priority = CPL_PRIORITY_DATA;
426		skb->csum = wrs_needed;	/* remember this until the WR_ACK */
427		csk->wr_cred -= wrs_needed;
428		csk->wr_una_cred += wrs_needed;
429		cxgbi_sock_enqueue_wr(csk, skb);
430
431		log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_TX,
432			"csk 0x%p, enqueue, skb len %u/%u, frag %u, wr %d, "
433			"left %u, unack %u.\n",
434			csk, skb->len, skb->data_len, frags, skb->csum,
435			csk->wr_cred, csk->wr_una_cred);
436
437		if (likely(cxgbi_skcb_test_flag(skb, SKCBF_TX_NEED_HDR))) {
438			if ((req_completion &&
439				csk->wr_una_cred == wrs_needed) ||
440			     csk->wr_una_cred >= csk->wr_max_cred / 2) {
441				req_completion = 1;
442				csk->wr_una_cred = 0;
443			}
444			len += cxgbi_ulp_extra_len(cxgbi_skcb_ulp_mode(skb));
445			make_tx_data_wr(csk, skb, len, req_completion);
446			csk->snd_nxt += len;
447			cxgbi_skcb_clear_flag(skb, SKCBF_TX_NEED_HDR);
448		}
449		total_size += skb->truesize;
450		log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_TX,
451			"csk 0x%p, tid 0x%x, send skb 0x%p.\n",
452			csk, csk->tid, skb);
453		set_arp_failure_handler(skb, arp_failure_skb_discard);
454		l2t_send(csk->cdev->lldev, skb, csk->l2t);
455	}
456	return total_size;
457}
458
459/*
460 * Process a CPL_ACT_ESTABLISH message: -> host
461 * Updates connection state from an active establish CPL message.  Runs with
462 * the connection lock held.
463 */
464
465static inline void free_atid(struct cxgbi_sock *csk)
466{
467	if (cxgbi_sock_flag(csk, CTPF_HAS_ATID)) {
468		cxgb3_free_atid(csk->cdev->lldev, csk->atid);
469		cxgbi_sock_clear_flag(csk, CTPF_HAS_ATID);
470		cxgbi_sock_put(csk);
471	}
472}
473
474static int do_act_establish(struct t3cdev *tdev, struct sk_buff *skb, void *ctx)
475{
476	struct cxgbi_sock *csk = ctx;
477	struct cpl_act_establish *req = cplhdr(skb);
478	unsigned int tid = GET_TID(req);
479	unsigned int atid = G_PASS_OPEN_TID(ntohl(req->tos_tid));
480	u32 rcv_isn = ntohl(req->rcv_isn);	/* real RCV_ISN + 1 */
481
482	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
483		"atid 0x%x,tid 0x%x, csk 0x%p,%u,0x%lx, isn %u.\n",
484		atid, atid, csk, csk->state, csk->flags, rcv_isn);
485
486	cxgbi_sock_get(csk);
487	cxgbi_sock_set_flag(csk, CTPF_HAS_TID);
488	csk->tid = tid;
489	cxgb3_insert_tid(csk->cdev->lldev, &t3_client, csk, tid);
490
491	free_atid(csk);
492
493	csk->rss_qid = G_QNUM(ntohs(skb->csum));
494
495	spin_lock_bh(&csk->lock);
496	if (csk->retry_timer.function) {
497		del_timer(&csk->retry_timer);
498		csk->retry_timer.function = NULL;
499	}
500
501	if (unlikely(csk->state != CTP_ACTIVE_OPEN))
502		pr_info("csk 0x%p,%u,0x%lx,%u, got EST.\n",
503			csk, csk->state, csk->flags, csk->tid);
504
505	csk->copied_seq = csk->rcv_wup = csk->rcv_nxt = rcv_isn;
506	if (cxgb3i_rcv_win > (M_RCV_BUFSIZ << 10))
507		csk->rcv_wup -= cxgb3i_rcv_win - (M_RCV_BUFSIZ << 10);
508
509	cxgbi_sock_established(csk, ntohl(req->snd_isn), ntohs(req->tcp_opt));
510
511	if (unlikely(cxgbi_sock_flag(csk, CTPF_ACTIVE_CLOSE_NEEDED)))
512		/* upper layer has requested closing */
513		send_abort_req(csk);
514	else {
515		if (skb_queue_len(&csk->write_queue))
516			push_tx_frames(csk, 1);
517		cxgbi_conn_tx_open(csk);
518	}
519
520	spin_unlock_bh(&csk->lock);
521	__kfree_skb(skb);
522	return 0;
523}
524
525/*
526 * Process a CPL_ACT_OPEN_RPL message: -> host
527 * Handle active open failures.
528 */
529static int act_open_rpl_status_to_errno(int status)
530{
531	switch (status) {
532	case CPL_ERR_CONN_RESET:
533		return -ECONNREFUSED;
534	case CPL_ERR_ARP_MISS:
535		return -EHOSTUNREACH;
536	case CPL_ERR_CONN_TIMEDOUT:
537		return -ETIMEDOUT;
538	case CPL_ERR_TCAM_FULL:
539		return -ENOMEM;
540	case CPL_ERR_CONN_EXIST:
541		return -EADDRINUSE;
542	default:
543		return -EIO;
544	}
545}
546
547static void act_open_retry_timer(unsigned long data)
548{
549	struct sk_buff *skb;
550	struct cxgbi_sock *csk = (struct cxgbi_sock *)data;
551
552	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
553		"csk 0x%p,%u,0x%lx,%u.\n",
554		csk, csk->state, csk->flags, csk->tid);
555
556	cxgbi_sock_get(csk);
557	spin_lock_bh(&csk->lock);
558	skb = alloc_wr(sizeof(struct cpl_act_open_req), 0, GFP_ATOMIC);
559	if (!skb)
560		cxgbi_sock_fail_act_open(csk, -ENOMEM);
561	else {
562		skb->sk = (struct sock *)csk;
563		set_arp_failure_handler(skb, act_open_arp_failure);
564		send_act_open_req(csk, skb, csk->l2t);
565	}
566	spin_unlock_bh(&csk->lock);
567	cxgbi_sock_put(csk);
568}
569
570static int do_act_open_rpl(struct t3cdev *tdev, struct sk_buff *skb, void *ctx)
571{
572	struct cxgbi_sock *csk = ctx;
573	struct cpl_act_open_rpl *rpl = cplhdr(skb);
574
575	pr_info("csk 0x%p,%u,0x%lx,%u, status %u, %pI4:%u-%pI4:%u.\n",
576		csk, csk->state, csk->flags, csk->atid, rpl->status,
577		&csk->saddr.sin_addr.s_addr, ntohs(csk->saddr.sin_port),
578		&csk->daddr.sin_addr.s_addr, ntohs(csk->daddr.sin_port));
579
580	if (rpl->status != CPL_ERR_TCAM_FULL &&
581	    rpl->status != CPL_ERR_CONN_EXIST &&
582	    rpl->status != CPL_ERR_ARP_MISS)
583		cxgb3_queue_tid_release(tdev, GET_TID(rpl));
584
585	cxgbi_sock_get(csk);
586	spin_lock_bh(&csk->lock);
587	if (rpl->status == CPL_ERR_CONN_EXIST &&
588	    csk->retry_timer.function != act_open_retry_timer) {
589		csk->retry_timer.function = act_open_retry_timer;
590		mod_timer(&csk->retry_timer, jiffies + HZ / 2);
591	} else
592		cxgbi_sock_fail_act_open(csk,
593				act_open_rpl_status_to_errno(rpl->status));
594
595	spin_unlock_bh(&csk->lock);
596	cxgbi_sock_put(csk);
597	__kfree_skb(skb);
598	return 0;
599}
600
601/*
602 * Process PEER_CLOSE CPL messages: -> host
603 * Handle peer FIN.
604 */
605static int do_peer_close(struct t3cdev *cdev, struct sk_buff *skb, void *ctx)
606{
607	struct cxgbi_sock *csk = ctx;
608
609	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
610		"csk 0x%p,%u,0x%lx,%u.\n",
611		csk, csk->state, csk->flags, csk->tid);
612
613	cxgbi_sock_rcv_peer_close(csk);
614	__kfree_skb(skb);
615	return 0;
616}
617
618/*
619 * Process CLOSE_CONN_RPL CPL message: -> host
620 * Process a peer ACK to our FIN.
621 */
622static int do_close_con_rpl(struct t3cdev *cdev, struct sk_buff *skb,
623			    void *ctx)
624{
625	struct cxgbi_sock *csk = ctx;
626	struct cpl_close_con_rpl *rpl = cplhdr(skb);
627
628	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
629		"csk 0x%p,%u,0x%lx,%u, snxt %u.\n",
630		csk, csk->state, csk->flags, csk->tid, ntohl(rpl->snd_nxt));
631
632	cxgbi_sock_rcv_close_conn_rpl(csk, ntohl(rpl->snd_nxt));
633	__kfree_skb(skb);
634	return 0;
635}
636
637/*
638 * Process ABORT_REQ_RSS CPL message: -> host
639 * Process abort requests.  If we are waiting for an ABORT_RPL we ignore this
640 * request except that we need to reply to it.
641 */
642
643static int abort_status_to_errno(struct cxgbi_sock *csk, int abort_reason,
644				 int *need_rst)
645{
646	switch (abort_reason) {
647	case CPL_ERR_BAD_SYN: /* fall through */
648	case CPL_ERR_CONN_RESET:
649		return csk->state > CTP_ESTABLISHED ? -EPIPE : -ECONNRESET;
650	case CPL_ERR_XMIT_TIMEDOUT:
651	case CPL_ERR_PERSIST_TIMEDOUT:
652	case CPL_ERR_FINWAIT2_TIMEDOUT:
653	case CPL_ERR_KEEPALIVE_TIMEDOUT:
654		return -ETIMEDOUT;
655	default:
656		return -EIO;
657	}
658}
659
660static int do_abort_req(struct t3cdev *cdev, struct sk_buff *skb, void *ctx)
661{
662	const struct cpl_abort_req_rss *req = cplhdr(skb);
663	struct cxgbi_sock *csk = ctx;
664	int rst_status = CPL_ABORT_NO_RST;
665
666	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
667		"csk 0x%p,%u,0x%lx,%u.\n",
668		csk, csk->state, csk->flags, csk->tid);
669
670	if (req->status == CPL_ERR_RTX_NEG_ADVICE ||
671	    req->status == CPL_ERR_PERSIST_NEG_ADVICE) {
672		goto done;
673	}
674
675	cxgbi_sock_get(csk);
676	spin_lock_bh(&csk->lock);
677
678	if (!cxgbi_sock_flag(csk, CTPF_ABORT_REQ_RCVD)) {
679		cxgbi_sock_set_flag(csk, CTPF_ABORT_REQ_RCVD);
680		cxgbi_sock_set_state(csk, CTP_ABORTING);
681		goto out;
682	}
683
684	cxgbi_sock_clear_flag(csk, CTPF_ABORT_REQ_RCVD);
685	send_abort_rpl(csk, rst_status);
686
687	if (!cxgbi_sock_flag(csk, CTPF_ABORT_RPL_PENDING)) {
688		csk->err = abort_status_to_errno(csk, req->status, &rst_status);
689		cxgbi_sock_closed(csk);
690	}
691
692out:
693	spin_unlock_bh(&csk->lock);
694	cxgbi_sock_put(csk);
695done:
696	__kfree_skb(skb);
697	return 0;
698}
699
700/*
701 * Process ABORT_RPL_RSS CPL message: -> host
702 * Process abort replies.  We only process these messages if we anticipate
703 * them as the coordination between SW and HW in this area is somewhat lacking
704 * and sometimes we get ABORT_RPLs after we are done with the connection that
705 * originated the ABORT_REQ.
706 */
707static int do_abort_rpl(struct t3cdev *cdev, struct sk_buff *skb, void *ctx)
708{
709	struct cpl_abort_rpl_rss *rpl = cplhdr(skb);
710	struct cxgbi_sock *csk = ctx;
711
712	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
713		"status 0x%x, csk 0x%p, s %u, 0x%lx.\n",
714		rpl->status, csk, csk ? csk->state : 0,
715		csk ? csk->flags : 0UL);
716	/*
717	 * Ignore replies to post-close aborts indicating that the abort was
718	 * requested too late.  These connections are terminated when we get
719	 * PEER_CLOSE or CLOSE_CON_RPL and by the time the abort_rpl_rss
720	 * arrives the TID is either no longer used or it has been recycled.
721	 */
722	if (rpl->status == CPL_ERR_ABORT_FAILED)
723		goto rel_skb;
724	/*
725	 * Sometimes we've already closed the connection, e.g., a post-close
726	 * abort races with ABORT_REQ_RSS, the latter frees the connection
727	 * expecting the ABORT_REQ will fail with CPL_ERR_ABORT_FAILED,
728	 * but FW turns the ABORT_REQ into a regular one and so we get
729	 * ABORT_RPL_RSS with status 0 and no connection.
730	 */
731	if (csk)
732		cxgbi_sock_rcv_abort_rpl(csk);
733rel_skb:
734	__kfree_skb(skb);
735	return 0;
736}
737
738/*
739 * Process RX_ISCSI_HDR CPL message: -> host
740 * Handle received PDUs, the payload could be DDP'ed. If not, the payload
741 * follow after the bhs.
742 */
743static int do_iscsi_hdr(struct t3cdev *t3dev, struct sk_buff *skb, void *ctx)
744{
745	struct cxgbi_sock *csk = ctx;
746	struct cpl_iscsi_hdr *hdr_cpl = cplhdr(skb);
747	struct cpl_iscsi_hdr_norss data_cpl;
748	struct cpl_rx_data_ddp_norss ddp_cpl;
749	unsigned int hdr_len, data_len, status;
750	unsigned int len;
751	int err;
752
753	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_RX,
754		"csk 0x%p,%u,0x%lx,%u, skb 0x%p,%u.\n",
755		csk, csk->state, csk->flags, csk->tid, skb, skb->len);
756
757	spin_lock_bh(&csk->lock);
758
759	if (unlikely(csk->state >= CTP_PASSIVE_CLOSE)) {
760		log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
761			"csk 0x%p,%u,0x%lx,%u, bad state.\n",
762			csk, csk->state, csk->flags, csk->tid);
763		if (csk->state != CTP_ABORTING)
764			goto abort_conn;
765		else
766			goto discard;
767	}
768
769	cxgbi_skcb_tcp_seq(skb) = ntohl(hdr_cpl->seq);
770	cxgbi_skcb_flags(skb) = 0;
771
772	skb_reset_transport_header(skb);
773	__skb_pull(skb, sizeof(struct cpl_iscsi_hdr));
774
775	len = hdr_len = ntohs(hdr_cpl->len);
776	/* msg coalesce is off or not enough data received */
777	if (skb->len <= hdr_len) {
778		pr_err("%s: tid %u, CPL_ISCSI_HDR, skb len %u < %u.\n",
779			csk->cdev->ports[csk->port_id]->name, csk->tid,
780			skb->len, hdr_len);
781		goto abort_conn;
782	}
783	cxgbi_skcb_set_flag(skb, SKCBF_RX_COALESCED);
784
785	err = skb_copy_bits(skb, skb->len - sizeof(ddp_cpl), &ddp_cpl,
786			    sizeof(ddp_cpl));
787	if (err < 0) {
788		pr_err("%s: tid %u, copy cpl_ddp %u-%zu failed %d.\n",
789			csk->cdev->ports[csk->port_id]->name, csk->tid,
790			skb->len, sizeof(ddp_cpl), err);
791		goto abort_conn;
792	}
793
794	cxgbi_skcb_set_flag(skb, SKCBF_RX_STATUS);
795	cxgbi_skcb_rx_pdulen(skb) = ntohs(ddp_cpl.len);
796	cxgbi_skcb_rx_ddigest(skb) = ntohl(ddp_cpl.ulp_crc);
797	status = ntohl(ddp_cpl.ddp_status);
798
799	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_RX,
800		"csk 0x%p, skb 0x%p,%u, pdulen %u, status 0x%x.\n",
801		csk, skb, skb->len, cxgbi_skcb_rx_pdulen(skb), status);
802
803	if (status & (1 << CPL_RX_DDP_STATUS_HCRC_SHIFT))
804		cxgbi_skcb_set_flag(skb, SKCBF_RX_HCRC_ERR);
805	if (status & (1 << CPL_RX_DDP_STATUS_DCRC_SHIFT))
806		cxgbi_skcb_set_flag(skb, SKCBF_RX_DCRC_ERR);
807	if (status & (1 << CPL_RX_DDP_STATUS_PAD_SHIFT))
808		cxgbi_skcb_set_flag(skb, SKCBF_RX_PAD_ERR);
809
810	if (skb->len > (hdr_len + sizeof(ddp_cpl))) {
811		err = skb_copy_bits(skb, hdr_len, &data_cpl, sizeof(data_cpl));
812		if (err < 0) {
813			pr_err("%s: tid %u, cp %zu/%u failed %d.\n",
814				csk->cdev->ports[csk->port_id]->name,
815				csk->tid, sizeof(data_cpl), skb->len, err);
816			goto abort_conn;
817		}
818		data_len = ntohs(data_cpl.len);
819		log_debug(1 << CXGBI_DBG_DDP | 1 << CXGBI_DBG_PDU_RX,
820			"skb 0x%p, pdu not ddp'ed %u/%u, status 0x%x.\n",
821			skb, data_len, cxgbi_skcb_rx_pdulen(skb), status);
822		len += sizeof(data_cpl) + data_len;
823	} else if (status & (1 << CPL_RX_DDP_STATUS_DDP_SHIFT))
824		cxgbi_skcb_set_flag(skb, SKCBF_RX_DATA_DDPD);
825
826	csk->rcv_nxt = ntohl(ddp_cpl.seq) + cxgbi_skcb_rx_pdulen(skb);
827	__pskb_trim(skb, len);
828	__skb_queue_tail(&csk->receive_queue, skb);
829	cxgbi_conn_pdu_ready(csk);
830
831	spin_unlock_bh(&csk->lock);
832	return 0;
833
834abort_conn:
835	send_abort_req(csk);
836discard:
837	spin_unlock_bh(&csk->lock);
838	__kfree_skb(skb);
839	return 0;
840}
841
842/*
843 * Process TX_DATA_ACK CPL messages: -> host
844 * Process an acknowledgment of WR completion.  Advance snd_una and send the
845 * next batch of work requests from the write queue.
846 */
847static int do_wr_ack(struct t3cdev *cdev, struct sk_buff *skb, void *ctx)
848{
849	struct cxgbi_sock *csk = ctx;
850	struct cpl_wr_ack *hdr = cplhdr(skb);
851
852	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_PDU_RX,
853		"csk 0x%p,%u,0x%lx,%u, cr %u.\n",
854		csk, csk->state, csk->flags, csk->tid, ntohs(hdr->credits));
855
856	cxgbi_sock_rcv_wr_ack(csk, ntohs(hdr->credits), ntohl(hdr->snd_una), 1);
857	__kfree_skb(skb);
858	return 0;
859}
860
861/*
862 * for each connection, pre-allocate skbs needed for close/abort requests. So
863 * that we can service the request right away.
864 */
865static int alloc_cpls(struct cxgbi_sock *csk)
866{
867	csk->cpl_close = alloc_wr(sizeof(struct cpl_close_con_req), 0,
868					GFP_KERNEL);
869	if (!csk->cpl_close)
870		return -ENOMEM;
871	csk->cpl_abort_req = alloc_wr(sizeof(struct cpl_abort_req), 0,
872					GFP_KERNEL);
873	if (!csk->cpl_abort_req)
874		goto free_cpl_skbs;
875
876	csk->cpl_abort_rpl = alloc_wr(sizeof(struct cpl_abort_rpl), 0,
877					GFP_KERNEL);
878	if (!csk->cpl_abort_rpl)
879		goto free_cpl_skbs;
880
881	return 0;
882
883free_cpl_skbs:
884	cxgbi_sock_free_cpl_skbs(csk);
885	return -ENOMEM;
886}
887
888/**
889 * release_offload_resources - release offload resource
890 * @c3cn: the offloaded iscsi tcp connection.
891 * Release resources held by an offload connection (TID, L2T entry, etc.)
892 */
893static void l2t_put(struct cxgbi_sock *csk)
894{
895	struct t3cdev *t3dev = (struct t3cdev *)csk->cdev->lldev;
896
897	if (csk->l2t) {
898		l2t_release(t3dev, csk->l2t);
899		csk->l2t = NULL;
900		cxgbi_sock_put(csk);
901	}
902}
903
904static void release_offload_resources(struct cxgbi_sock *csk)
905{
906	struct t3cdev *t3dev = (struct t3cdev *)csk->cdev->lldev;
907
908	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
909		"csk 0x%p,%u,0x%lx,%u.\n",
910		csk, csk->state, csk->flags, csk->tid);
911
912	csk->rss_qid = 0;
913	cxgbi_sock_free_cpl_skbs(csk);
914
915	if (csk->wr_cred != csk->wr_max_cred) {
916		cxgbi_sock_purge_wr_queue(csk);
917		cxgbi_sock_reset_wr_list(csk);
918	}
919	l2t_put(csk);
920	if (cxgbi_sock_flag(csk, CTPF_HAS_ATID))
921		free_atid(csk);
922	else if (cxgbi_sock_flag(csk, CTPF_HAS_TID)) {
923		cxgb3_remove_tid(t3dev, (void *)csk, csk->tid);
924		cxgbi_sock_clear_flag(csk, CTPF_HAS_TID);
925		cxgbi_sock_put(csk);
926	}
927	csk->dst = NULL;
928	csk->cdev = NULL;
929}
930
931static void update_address(struct cxgbi_hba *chba)
932{
933	if (chba->ipv4addr) {
934		if (chba->vdev &&
935		    chba->ipv4addr != cxgb3i_get_private_ipv4addr(chba->vdev)) {
936			cxgb3i_set_private_ipv4addr(chba->vdev, chba->ipv4addr);
937			cxgb3i_set_private_ipv4addr(chba->ndev, 0);
938			pr_info("%s set %pI4.\n",
939				chba->vdev->name, &chba->ipv4addr);
940		} else if (chba->ipv4addr !=
941				cxgb3i_get_private_ipv4addr(chba->ndev)) {
942			cxgb3i_set_private_ipv4addr(chba->ndev, chba->ipv4addr);
943			pr_info("%s set %pI4.\n",
944				chba->ndev->name, &chba->ipv4addr);
945		}
946	} else if (cxgb3i_get_private_ipv4addr(chba->ndev)) {
947		if (chba->vdev)
948			cxgb3i_set_private_ipv4addr(chba->vdev, 0);
949		cxgb3i_set_private_ipv4addr(chba->ndev, 0);
950	}
951}
952
953static int init_act_open(struct cxgbi_sock *csk)
954{
955	struct dst_entry *dst = csk->dst;
956	struct cxgbi_device *cdev = csk->cdev;
957	struct t3cdev *t3dev = (struct t3cdev *)cdev->lldev;
958	struct net_device *ndev = cdev->ports[csk->port_id];
959	struct cxgbi_hba *chba = cdev->hbas[csk->port_id];
960	struct sk_buff *skb = NULL;
961
962	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
963		"csk 0x%p,%u,0x%lx.\n", csk, csk->state, csk->flags);
964
965	update_address(chba);
966	if (chba->ipv4addr)
967		csk->saddr.sin_addr.s_addr = chba->ipv4addr;
968
969	csk->rss_qid = 0;
970	csk->l2t = t3_l2t_get(t3dev, dst, ndev,
971			      &csk->daddr.sin_addr.s_addr);
972	if (!csk->l2t) {
973		pr_err("NO l2t available.\n");
974		return -EINVAL;
975	}
976	cxgbi_sock_get(csk);
977
978	csk->atid = cxgb3_alloc_atid(t3dev, &t3_client, csk);
979	if (csk->atid < 0) {
980		pr_err("NO atid available.\n");
981		goto rel_resource;
982	}
983	cxgbi_sock_set_flag(csk, CTPF_HAS_ATID);
984	cxgbi_sock_get(csk);
985
986	skb = alloc_wr(sizeof(struct cpl_act_open_req), 0, GFP_KERNEL);
987	if (!skb)
988		goto rel_resource;
989	skb->sk = (struct sock *)csk;
990	set_arp_failure_handler(skb, act_open_arp_failure);
991
992	csk->wr_max_cred = csk->wr_cred = T3C_DATA(t3dev)->max_wrs - 1;
993	csk->wr_una_cred = 0;
994	csk->mss_idx = cxgbi_sock_select_mss(csk, dst_mtu(dst));
995	cxgbi_sock_reset_wr_list(csk);
996	csk->err = 0;
997
998	log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
999		"csk 0x%p,%u,0x%lx, %pI4:%u-%pI4:%u.\n",
1000		csk, csk->state, csk->flags,
1001		&csk->saddr.sin_addr.s_addr, ntohs(csk->saddr.sin_port),
1002		&csk->daddr.sin_addr.s_addr, ntohs(csk->daddr.sin_port));
1003
1004	cxgbi_sock_set_state(csk, CTP_ACTIVE_OPEN);
1005	send_act_open_req(csk, skb, csk->l2t);
1006	return 0;
1007
1008rel_resource:
1009	if (skb)
1010		__kfree_skb(skb);
1011	return -EINVAL;
1012}
1013
1014cxgb3_cpl_handler_func cxgb3i_cpl_handlers[NUM_CPL_CMDS] = {
1015	[CPL_ACT_ESTABLISH] = do_act_establish,
1016	[CPL_ACT_OPEN_RPL] = do_act_open_rpl,
1017	[CPL_PEER_CLOSE] = do_peer_close,
1018	[CPL_ABORT_REQ_RSS] = do_abort_req,
1019	[CPL_ABORT_RPL_RSS] = do_abort_rpl,
1020	[CPL_CLOSE_CON_RPL] = do_close_con_rpl,
1021	[CPL_TX_DMA_ACK] = do_wr_ack,
1022	[CPL_ISCSI_HDR] = do_iscsi_hdr,
1023};
1024
1025/**
1026 * cxgb3i_ofld_init - allocate and initialize resources for each adapter found
1027 * @cdev:	cxgbi adapter
1028 */
1029int cxgb3i_ofld_init(struct cxgbi_device *cdev)
1030{
1031	struct t3cdev *t3dev = (struct t3cdev *)cdev->lldev;
1032	struct adap_ports port;
1033	struct ofld_page_info rx_page_info;
1034	unsigned int wr_len;
1035	int rc;
1036
1037	if (t3dev->ctl(t3dev, GET_WR_LEN, &wr_len) < 0 ||
1038	    t3dev->ctl(t3dev, GET_PORTS, &port) < 0 ||
1039	    t3dev->ctl(t3dev, GET_RX_PAGE_INFO, &rx_page_info) < 0) {
1040		pr_warn("t3 0x%p, offload up, ioctl failed.\n", t3dev);
1041		return -EINVAL;
1042	}
1043
1044	if (cxgb3i_max_connect > CXGBI_MAX_CONN)
1045		cxgb3i_max_connect = CXGBI_MAX_CONN;
1046
1047	rc = cxgbi_device_portmap_create(cdev, cxgb3i_sport_base,
1048					cxgb3i_max_connect);
1049	if (rc < 0)
1050		return rc;
1051
1052	init_wr_tab(wr_len);
1053	cdev->csk_release_offload_resources = release_offload_resources;
1054	cdev->csk_push_tx_frames = push_tx_frames;
1055	cdev->csk_send_abort_req = send_abort_req;
1056	cdev->csk_send_close_req = send_close_req;
1057	cdev->csk_send_rx_credits = send_rx_credits;
1058	cdev->csk_alloc_cpls = alloc_cpls;
1059	cdev->csk_init_act_open = init_act_open;
1060
1061	pr_info("cdev 0x%p, offload up, added.\n", cdev);
1062	return 0;
1063}
1064
1065/*
1066 * functions to program the pagepod in h/w
1067 */
1068static inline void ulp_mem_io_set_hdr(struct sk_buff *skb, unsigned int addr)
1069{
1070	struct ulp_mem_io *req = (struct ulp_mem_io *)skb->head;
1071
1072	memset(req, 0, sizeof(*req));
1073
1074	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_BYPASS));
1075	req->cmd_lock_addr = htonl(V_ULP_MEMIO_ADDR(addr >> 5) |
1076				   V_ULPTX_CMD(ULP_MEM_WRITE));
1077	req->len = htonl(V_ULP_MEMIO_DATA_LEN(PPOD_SIZE >> 5) |
1078			 V_ULPTX_NFLITS((PPOD_SIZE >> 3) + 1));
1079}
1080
1081static int ddp_set_map(struct cxgbi_sock *csk, struct cxgbi_pagepod_hdr *hdr,
1082			unsigned int idx, unsigned int npods,
1083				struct cxgbi_gather_list *gl)
1084{
1085	struct cxgbi_device *cdev = csk->cdev;
1086	struct cxgbi_ddp_info *ddp = cdev->ddp;
1087	unsigned int pm_addr = (idx << PPOD_SIZE_SHIFT) + ddp->llimit;
1088	int i;
1089
1090	log_debug(1 << CXGBI_DBG_DDP,
1091		"csk 0x%p, idx %u, npods %u, gl 0x%p.\n",
1092		csk, idx, npods, gl);
1093
1094	for (i = 0; i < npods; i++, idx++, pm_addr += PPOD_SIZE) {
1095		struct sk_buff *skb = alloc_wr(sizeof(struct ulp_mem_io) +
1096						PPOD_SIZE, 0, GFP_ATOMIC);
1097
1098		if (!skb)
1099			return -ENOMEM;
1100
1101		ulp_mem_io_set_hdr(skb, pm_addr);
1102		cxgbi_ddp_ppod_set((struct cxgbi_pagepod *)(skb->head +
1103					sizeof(struct ulp_mem_io)),
1104				   hdr, gl, i * PPOD_PAGES_MAX);
1105		skb->priority = CPL_PRIORITY_CONTROL;
1106		cxgb3_ofld_send(cdev->lldev, skb);
1107	}
1108	return 0;
1109}
1110
1111static void ddp_clear_map(struct cxgbi_hba *chba, unsigned int tag,
1112			  unsigned int idx, unsigned int npods)
1113{
1114	struct cxgbi_device *cdev = chba->cdev;
1115	struct cxgbi_ddp_info *ddp = cdev->ddp;
1116	unsigned int pm_addr = (idx << PPOD_SIZE_SHIFT) + ddp->llimit;
1117	int i;
1118
1119	log_debug(1 << CXGBI_DBG_DDP,
1120		"cdev 0x%p, idx %u, npods %u, tag 0x%x.\n",
1121		cdev, idx, npods, tag);
1122
1123	for (i = 0; i < npods; i++, idx++, pm_addr += PPOD_SIZE) {
1124		struct sk_buff *skb = alloc_wr(sizeof(struct ulp_mem_io) +
1125						PPOD_SIZE, 0, GFP_ATOMIC);
1126
1127		if (!skb) {
1128			pr_err("tag 0x%x, 0x%x, %d/%u, skb OOM.\n",
1129				tag, idx, i, npods);
1130			continue;
1131		}
1132		ulp_mem_io_set_hdr(skb, pm_addr);
1133		skb->priority = CPL_PRIORITY_CONTROL;
1134		cxgb3_ofld_send(cdev->lldev, skb);
1135	}
1136}
1137
1138static int ddp_setup_conn_pgidx(struct cxgbi_sock *csk,
1139				       unsigned int tid, int pg_idx, bool reply)
1140{
1141	struct sk_buff *skb = alloc_wr(sizeof(struct cpl_set_tcb_field), 0,
1142					GFP_KERNEL);
1143	struct cpl_set_tcb_field *req;
1144	u64 val = pg_idx < DDP_PGIDX_MAX ? pg_idx : 0;
1145
1146	log_debug(1 << CXGBI_DBG_DDP,
1147		"csk 0x%p, tid %u, pg_idx %d.\n", csk, tid, pg_idx);
1148	if (!skb)
1149		return -ENOMEM;
1150
1151	/* set up ulp submode and page size */
1152	req = (struct cpl_set_tcb_field *)skb->head;
1153	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1154	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, tid));
1155	req->reply = V_NO_REPLY(reply ? 0 : 1);
1156	req->cpu_idx = 0;
1157	req->word = htons(31);
1158	req->mask = cpu_to_be64(0xF0000000);
1159	req->val = cpu_to_be64(val << 28);
1160	skb->priority = CPL_PRIORITY_CONTROL;
1161
1162	cxgb3_ofld_send(csk->cdev->lldev, skb);
1163	return 0;
1164}
1165
1166/**
1167 * cxgb3i_setup_conn_digest - setup conn. digest setting
1168 * @csk: cxgb tcp socket
1169 * @tid: connection id
1170 * @hcrc: header digest enabled
1171 * @dcrc: data digest enabled
1172 * @reply: request reply from h/w
1173 * set up the iscsi digest settings for a connection identified by tid
1174 */
1175static int ddp_setup_conn_digest(struct cxgbi_sock *csk, unsigned int tid,
1176			     int hcrc, int dcrc, int reply)
1177{
1178	struct sk_buff *skb = alloc_wr(sizeof(struct cpl_set_tcb_field), 0,
1179					GFP_KERNEL);
1180	struct cpl_set_tcb_field *req;
1181	u64 val = (hcrc ? 1 : 0) | (dcrc ? 2 : 0);
1182
1183	log_debug(1 << CXGBI_DBG_DDP,
1184		"csk 0x%p, tid %u, crc %d,%d.\n", csk, tid, hcrc, dcrc);
1185	if (!skb)
1186		return -ENOMEM;
1187
1188	/* set up ulp submode and page size */
1189	req = (struct cpl_set_tcb_field *)skb->head;
1190	req->wr.wr_hi = htonl(V_WR_OP(FW_WROPCODE_FORWARD));
1191	OPCODE_TID(req) = htonl(MK_OPCODE_TID(CPL_SET_TCB_FIELD, tid));
1192	req->reply = V_NO_REPLY(reply ? 0 : 1);
1193	req->cpu_idx = 0;
1194	req->word = htons(31);
1195	req->mask = cpu_to_be64(0x0F000000);
1196	req->val = cpu_to_be64(val << 24);
1197	skb->priority = CPL_PRIORITY_CONTROL;
1198
1199	cxgb3_ofld_send(csk->cdev->lldev, skb);
1200	return 0;
1201}
1202
1203/**
1204 * t3_ddp_cleanup - release the cxgb3 adapter's ddp resource
1205 * @cdev: cxgb3i adapter
1206 * release all the resource held by the ddp pagepod manager for a given
1207 * adapter if needed
1208 */
1209
1210static void t3_ddp_cleanup(struct cxgbi_device *cdev)
1211{
1212	struct t3cdev *tdev = (struct t3cdev *)cdev->lldev;
1213
1214	if (cxgbi_ddp_cleanup(cdev)) {
1215		pr_info("t3dev 0x%p, ulp_iscsi no more user.\n", tdev);
1216		tdev->ulp_iscsi = NULL;
1217	}
1218}
1219
1220/**
1221 * ddp_init - initialize the cxgb3 adapter's ddp resource
1222 * @cdev: cxgb3i adapter
1223 * initialize the ddp pagepod manager for a given adapter
1224 */
1225static int cxgb3i_ddp_init(struct cxgbi_device *cdev)
1226{
1227	struct t3cdev *tdev = (struct t3cdev *)cdev->lldev;
1228	struct cxgbi_ddp_info *ddp = tdev->ulp_iscsi;
1229	struct ulp_iscsi_info uinfo;
1230	unsigned int pgsz_factor[4];
1231	int i, err;
1232
1233	if (ddp) {
1234		kref_get(&ddp->refcnt);
1235		pr_warn("t3dev 0x%p, ddp 0x%p already set up.\n",
1236			tdev, tdev->ulp_iscsi);
1237		cdev->ddp = ddp;
1238		return -EALREADY;
1239	}
1240
1241	err = tdev->ctl(tdev, ULP_ISCSI_GET_PARAMS, &uinfo);
1242	if (err < 0) {
1243		pr_err("%s, failed to get iscsi param err=%d.\n",
1244			 tdev->name, err);
1245		return err;
1246	}
1247
1248	err = cxgbi_ddp_init(cdev, uinfo.llimit, uinfo.ulimit,
1249			uinfo.max_txsz, uinfo.max_rxsz);
1250	if (err < 0)
1251		return err;
1252
1253	ddp = cdev->ddp;
1254
1255	uinfo.tagmask = ddp->idx_mask << PPOD_IDX_SHIFT;
1256	cxgbi_ddp_page_size_factor(pgsz_factor);
1257	for (i = 0; i < 4; i++)
1258		uinfo.pgsz_factor[i] = pgsz_factor[i];
1259	uinfo.ulimit = uinfo.llimit + (ddp->nppods << PPOD_SIZE_SHIFT);
1260
1261	err = tdev->ctl(tdev, ULP_ISCSI_SET_PARAMS, &uinfo);
1262	if (err < 0) {
1263		pr_warn("%s unable to set iscsi param err=%d, ddp disabled.\n",
1264			tdev->name, err);
1265		cxgbi_ddp_cleanup(cdev);
1266		return err;
1267	}
1268	tdev->ulp_iscsi = ddp;
1269
1270	cdev->csk_ddp_setup_digest = ddp_setup_conn_digest;
1271	cdev->csk_ddp_setup_pgidx = ddp_setup_conn_pgidx;
1272	cdev->csk_ddp_set = ddp_set_map;
1273	cdev->csk_ddp_clear = ddp_clear_map;
1274
1275	pr_info("tdev 0x%p, nppods %u, bits %u, mask 0x%x,0x%x pkt %u/%u, "
1276		"%u/%u.\n",
1277		tdev, ddp->nppods, ddp->idx_bits, ddp->idx_mask,
1278		ddp->rsvd_tag_mask, ddp->max_txsz, uinfo.max_txsz,
1279		ddp->max_rxsz, uinfo.max_rxsz);
1280	return 0;
1281}
1282
1283static void cxgb3i_dev_close(struct t3cdev *t3dev)
1284{
1285	struct cxgbi_device *cdev = cxgbi_device_find_by_lldev(t3dev);
1286
1287	if (!cdev || cdev->flags & CXGBI_FLAG_ADAPTER_RESET) {
1288		pr_info("0x%p close, f 0x%x.\n", cdev, cdev ? cdev->flags : 0);
1289		return;
1290	}
1291
1292	cxgbi_device_unregister(cdev);
1293}
1294
1295/**
1296 * cxgb3i_dev_open - init a t3 adapter structure and any h/w settings
1297 * @t3dev: t3cdev adapter
1298 */
1299static void cxgb3i_dev_open(struct t3cdev *t3dev)
1300{
1301	struct cxgbi_device *cdev = cxgbi_device_find_by_lldev(t3dev);
1302	struct adapter *adapter = tdev2adap(t3dev);
1303	int i, err;
1304
1305	if (cdev) {
1306		pr_info("0x%p, updating.\n", cdev);
1307		return;
1308	}
1309
1310	cdev = cxgbi_device_register(0, adapter->params.nports);
1311	if (!cdev) {
1312		pr_warn("device 0x%p register failed.\n", t3dev);
1313		return;
1314	}
1315
1316	cdev->flags = CXGBI_FLAG_DEV_T3 | CXGBI_FLAG_IPV4_SET;
1317	cdev->lldev = t3dev;
1318	cdev->pdev = adapter->pdev;
1319	cdev->ports = adapter->port;
1320	cdev->nports = adapter->params.nports;
1321	cdev->mtus = adapter->params.mtus;
1322	cdev->nmtus = NMTUS;
1323	cdev->snd_win = cxgb3i_snd_win;
1324	cdev->rcv_win = cxgb3i_rcv_win;
1325	cdev->rx_credit_thres = cxgb3i_rx_credit_thres;
1326	cdev->skb_tx_rsvd = CXGB3I_TX_HEADER_LEN;
1327	cdev->skb_rx_extra = sizeof(struct cpl_iscsi_hdr_norss);
1328	cdev->dev_ddp_cleanup = t3_ddp_cleanup;
1329	cdev->itp = &cxgb3i_iscsi_transport;
1330
1331	err = cxgb3i_ddp_init(cdev);
1332	if (err) {
1333		pr_info("0x%p ddp init failed\n", cdev);
1334		goto err_out;
1335	}
1336
1337	err = cxgb3i_ofld_init(cdev);
1338	if (err) {
1339		pr_info("0x%p offload init failed\n", cdev);
1340		goto err_out;
1341	}
1342
1343	err = cxgbi_hbas_add(cdev, CXGB3I_MAX_LUN, CXGBI_MAX_CONN,
1344				&cxgb3i_host_template, cxgb3i_stt);
1345	if (err)
1346		goto err_out;
1347
1348	for (i = 0; i < cdev->nports; i++)
1349		cdev->hbas[i]->ipv4addr =
1350			cxgb3i_get_private_ipv4addr(cdev->ports[i]);
1351
1352	pr_info("cdev 0x%p, f 0x%x, t3dev 0x%p open, err %d.\n",
1353		cdev, cdev ? cdev->flags : 0, t3dev, err);
1354	return;
1355
1356err_out:
1357	cxgbi_device_unregister(cdev);
1358}
1359
1360static void cxgb3i_dev_event_handler(struct t3cdev *t3dev, u32 event, u32 port)
1361{
1362	struct cxgbi_device *cdev = cxgbi_device_find_by_lldev(t3dev);
1363
1364	log_debug(1 << CXGBI_DBG_TOE,
1365		"0x%p, cdev 0x%p, event 0x%x, port 0x%x.\n",
1366		t3dev, cdev, event, port);
1367	if (!cdev)
1368		return;
1369
1370	switch (event) {
1371	case OFFLOAD_STATUS_DOWN:
1372		cdev->flags |= CXGBI_FLAG_ADAPTER_RESET;
1373		break;
1374	case OFFLOAD_STATUS_UP:
1375		cdev->flags &= ~CXGBI_FLAG_ADAPTER_RESET;
1376		break;
1377	}
1378}
1379
1380/**
1381 * cxgb3i_init_module - module init entry point
1382 *
1383 * initialize any driver wide global data structures and register itself
1384 *	with the cxgb3 module
1385 */
1386static int __init cxgb3i_init_module(void)
1387{
1388	int rc;
1389
1390	printk(KERN_INFO "%s", version);
1391
1392	rc = cxgbi_iscsi_init(&cxgb3i_iscsi_transport, &cxgb3i_stt);
1393	if (rc < 0)
1394		return rc;
1395
1396	cxgb3_register_client(&t3_client);
1397	return 0;
1398}
1399
1400/**
1401 * cxgb3i_exit_module - module cleanup/exit entry point
1402 *
1403 * go through the driver hba list and for each hba, release any resource held.
1404 *	and unregisters iscsi transport and the cxgb3 module
1405 */
1406static void __exit cxgb3i_exit_module(void)
1407{
1408	cxgb3_unregister_client(&t3_client);
1409	cxgbi_device_unregister_all(CXGBI_FLAG_DEV_T3);
1410	cxgbi_iscsi_cleanup(&cxgb3i_iscsi_transport, &cxgb3i_stt);
1411}
1412
1413module_init(cxgb3i_init_module);
1414module_exit(cxgb3i_exit_module);
1415