cq.c (13281B)
/*
 * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved.
 * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved.
 * Copyright (c) 2005, 2006, 2007 Cisco Systems, Inc. All rights reserved.
 * Copyright (c) 2005, 2006, 2007, 2008 Mellanox Technologies. All rights reserved.
 * Copyright (c) 2004 Voltaire, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses. You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#include <linux/hardirq.h>
#include <linux/export.h>

#include <linux/mlx4/cmd.h>
#include <linux/mlx4/cq.h>

#include "mlx4.h"
#include "icm.h"

#define MLX4_CQ_STATUS_OK		( 0 << 28)
#define MLX4_CQ_STATUS_OVERFLOW		( 9 << 28)
#define MLX4_CQ_STATUS_WRITE_FAIL	(10 << 28)
#define MLX4_CQ_FLAG_CC			( 1 << 18)
#define MLX4_CQ_FLAG_OI			( 1 << 17)
#define MLX4_CQ_STATE_ARMED		( 9 <<  8)
#define MLX4_CQ_STATE_ARMED_SOL		( 6 <<  8)
#define MLX4_EQ_STATE_FIRED		(10 <<  8)

#define TASKLET_MAX_TIME 2
#define TASKLET_MAX_TIME_JIFFIES msecs_to_jiffies(TASKLET_MAX_TIME)

void mlx4_cq_tasklet_cb(struct tasklet_struct *t)
{
	unsigned long flags;
	unsigned long end = jiffies + TASKLET_MAX_TIME_JIFFIES;
	struct mlx4_eq_tasklet *ctx = from_tasklet(ctx, t, task);
	struct mlx4_cq *mcq, *temp;

	spin_lock_irqsave(&ctx->lock, flags);
	list_splice_tail_init(&ctx->list, &ctx->process_list);
	spin_unlock_irqrestore(&ctx->lock, flags);

	list_for_each_entry_safe(mcq, temp, &ctx->process_list, tasklet_ctx.list) {
		list_del_init(&mcq->tasklet_ctx.list);
		mcq->tasklet_ctx.comp(mcq);
		if (refcount_dec_and_test(&mcq->refcount))
			complete(&mcq->free);
		if (time_after(jiffies, end))
			break;
	}

	if (!list_empty(&ctx->process_list))
		tasklet_schedule(&ctx->task);
}

static void mlx4_add_cq_to_tasklet(struct mlx4_cq *cq)
{
	struct mlx4_eq_tasklet *tasklet_ctx = cq->tasklet_ctx.priv;
	unsigned long flags;
	bool kick;

	spin_lock_irqsave(&tasklet_ctx->lock, flags);
	/* When migrating CQs between EQs is implemented, note that this
	 * point must be synchronized: while a CQ is being migrated,
	 * completions from the old EQ could still arrive.
	 */
	if (list_empty_careful(&cq->tasklet_ctx.list)) {
		refcount_inc(&cq->refcount);
		kick = list_empty(&tasklet_ctx->list);
		list_add_tail(&cq->tasklet_ctx.list, &tasklet_ctx->list);
		if (kick)
			tasklet_schedule(&tasklet_ctx->task);
	}
	spin_unlock_irqrestore(&tasklet_ctx->lock, flags);
}

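/* Completion event dispatch, called from the EQ interrupt handler.
 * Looking the CQ up under rcu_read_lock() is enough here; as noted
 * below, the CQ is only freed once interrupt handling has finished.
 */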
void mlx4_cq_completion(struct mlx4_dev *dev, u32 cqn)
{
	struct mlx4_cq *cq;

	rcu_read_lock();
	cq = radix_tree_lookup(&mlx4_priv(dev)->cq_table.tree,
			       cqn & (dev->caps.num_cqs - 1));
	rcu_read_unlock();

	if (!cq) {
		mlx4_dbg(dev, "Completion event for bogus CQ %08x\n", cqn);
		return;
	}

	/* Accessing the CQ outside of rcu_read_lock is safe, because
	 * the CQ is freed only after interrupt handling is completed.
	 */
	++cq->arm_sn;

	cq->comp(cq);
}

void mlx4_cq_event(struct mlx4_dev *dev, u32 cqn, int event_type)
{
	struct mlx4_cq_table *cq_table = &mlx4_priv(dev)->cq_table;
	struct mlx4_cq *cq;

	rcu_read_lock();
	cq = radix_tree_lookup(&cq_table->tree, cqn & (dev->caps.num_cqs - 1));
	rcu_read_unlock();

	if (!cq) {
		mlx4_dbg(dev, "Async event for bogus CQ %08x\n", cqn);
		return;
	}

	/* Accessing the CQ outside of rcu_read_lock is safe, because
	 * the CQ is freed only after interrupt handling is completed.
	 */
	cq->event(cq, event_type);
}

static int mlx4_SW2HW_CQ(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *mailbox,
			 int cq_num, u8 opmod)
{
	return mlx4_cmd(dev, mailbox->dma, cq_num, opmod,
			MLX4_CMD_SW2HW_CQ, MLX4_CMD_TIME_CLASS_A,
			MLX4_CMD_WRAPPED);
}

static int mlx4_MODIFY_CQ(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *mailbox,
			  int cq_num, u32 opmod)
{
	return mlx4_cmd(dev, mailbox->dma, cq_num, opmod, MLX4_CMD_MODIFY_CQ,
			MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
}

static int mlx4_HW2SW_CQ(struct mlx4_dev *dev, struct mlx4_cmd_mailbox *mailbox,
			 int cq_num)
{
	return mlx4_cmd_box(dev, 0, mailbox ? mailbox->dma : 0,
			    cq_num, mailbox ? 0 : 1, MLX4_CMD_HW2SW_CQ,
			    MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
}

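/* Tune event moderation for an existing CQ: the HCA holds back the
 * completion event until either "count" CQEs have accumulated or the
 * "period" timer expires, whichever happens first.
 */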
int mlx4_cq_modify(struct mlx4_dev *dev, struct mlx4_cq *cq,
		   u16 count, u16 period)
{
	struct mlx4_cmd_mailbox *mailbox;
	struct mlx4_cq_context *cq_context;
	int err;

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox))
		return PTR_ERR(mailbox);

	cq_context = mailbox->buf;
	cq_context->cq_max_count = cpu_to_be16(count);
	cq_context->cq_period = cpu_to_be16(period);

	err = mlx4_MODIFY_CQ(dev, mailbox, cq->cqn, 1);

	mlx4_free_cmd_mailbox(dev, mailbox);
	return err;
}
EXPORT_SYMBOL_GPL(mlx4_cq_modify);

int mlx4_cq_resize(struct mlx4_dev *dev, struct mlx4_cq *cq,
		   int entries, struct mlx4_mtt *mtt)
{
	struct mlx4_cmd_mailbox *mailbox;
	struct mlx4_cq_context *cq_context;
	u64 mtt_addr;
	int err;

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox))
		return PTR_ERR(mailbox);

	cq_context = mailbox->buf;
	cq_context->logsize_usrpage = cpu_to_be32(ilog2(entries) << 24);
	cq_context->log_page_size = mtt->page_shift - 12;
	mtt_addr = mlx4_mtt_addr(dev, mtt);
	cq_context->mtt_base_addr_h = mtt_addr >> 32;
	cq_context->mtt_base_addr_l = cpu_to_be32(mtt_addr & 0xffffffff);

	err = mlx4_MODIFY_CQ(dev, mailbox, cq->cqn, 0);

	mlx4_free_cmd_mailbox(dev, mailbox);
	return err;
}
EXPORT_SYMBOL_GPL(mlx4_cq_resize);

int __mlx4_cq_alloc_icm(struct mlx4_dev *dev, int *cqn)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_cq_table *cq_table = &priv->cq_table;
	int err;

	*cqn = mlx4_bitmap_alloc(&cq_table->bitmap);
	if (*cqn == -1)
		return -ENOMEM;

	err = mlx4_table_get(dev, &cq_table->table, *cqn);
	if (err)
		goto err_out;

	err = mlx4_table_get(dev, &cq_table->cmpt_table, *cqn);
	if (err)
		goto err_put;
	return 0;

err_put:
	mlx4_table_put(dev, &cq_table->table, *cqn);

err_out:
	mlx4_bitmap_free(&cq_table->bitmap, *cqn, MLX4_NO_RR);
	return err;
}

static int mlx4_cq_alloc_icm(struct mlx4_dev *dev, int *cqn, u8 usage)
{
	u32 in_modifier = RES_CQ | (((u32)usage & 3) << 30);
	u64 out_param;
	int err;

	if (mlx4_is_mfunc(dev)) {
		err = mlx4_cmd_imm(dev, 0, &out_param, in_modifier,
				   RES_OP_RESERVE_AND_MAP, MLX4_CMD_ALLOC_RES,
				   MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
		if (err)
			return err;

		*cqn = get_param_l(&out_param);
		return 0;
	}
	return __mlx4_cq_alloc_icm(dev, cqn);
}

void __mlx4_cq_free_icm(struct mlx4_dev *dev, int cqn)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_cq_table *cq_table = &priv->cq_table;

	mlx4_table_put(dev, &cq_table->cmpt_table, cqn);
	mlx4_table_put(dev, &cq_table->table, cqn);
	mlx4_bitmap_free(&cq_table->bitmap, cqn, MLX4_NO_RR);
}

static void mlx4_cq_free_icm(struct mlx4_dev *dev, int cqn)
{
	u64 in_param = 0;
	int err;

	if (mlx4_is_mfunc(dev)) {
		set_param_l(&in_param, cqn);
		err = mlx4_cmd(dev, in_param, RES_CQ, RES_OP_RESERVE_AND_MAP,
			       MLX4_CMD_FREE_RES,
			       MLX4_CMD_TIME_CLASS_A, MLX4_CMD_WRAPPED);
		if (err)
			mlx4_warn(dev, "Failed freeing cq:%d\n", cqn);
	} else {
		__mlx4_cq_free_icm(dev, cqn);
	}
}

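/* When the HCA reports MLX4_DEV_CAP_FLAG2_SW_CQ_INIT, software is
 * expected to pre-initialize the CQE buffer to 0xcc before SW2HW_CQ;
 * the two helpers below cover the user-space and kernel buffer cases.
 */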
static int mlx4_init_user_cqes(void *buf, int entries, int cqe_size)
{
	int entries_per_copy = PAGE_SIZE / cqe_size;
	void *init_ents;
	int err = 0;
	int i;

	init_ents = kmalloc(PAGE_SIZE, GFP_KERNEL);
	if (!init_ents)
		return -ENOMEM;

	/* Populate a list of CQ entries to reduce the number of
	 * copy_to_user calls. 0xcc is the initialization value
	 * required by the FW.
	 */
	memset(init_ents, 0xcc, PAGE_SIZE);

	if (entries_per_copy < entries) {
		for (i = 0; i < entries / entries_per_copy; i++) {
			err = copy_to_user((void __user *)buf, init_ents,
					   PAGE_SIZE) ?
				-EFAULT : 0;
			if (err)
				goto out;

			buf += PAGE_SIZE;
		}
	} else {
		err = copy_to_user((void __user *)buf, init_ents,
				   array_size(entries, cqe_size)) ?
			-EFAULT : 0;
	}

out:
	kfree(init_ents);

	return err;
}

static void mlx4_init_kernel_cqes(struct mlx4_buf *buf,
				  int entries,
				  int cqe_size)
{
	int i;

	if (buf->nbufs == 1)
		memset(buf->direct.buf, 0xcc, entries * cqe_size);
	else
		for (i = 0; i < buf->npages; i++)
			memset(buf->page_list[i].buf, 0xcc,
			       1UL << buf->page_shift);
}

int mlx4_cq_alloc(struct mlx4_dev *dev, int nent,
		  struct mlx4_mtt *mtt, struct mlx4_uar *uar, u64 db_rec,
		  struct mlx4_cq *cq, unsigned vector, int collapsed,
		  int timestamp_en, void *buf_addr, bool user_cq)
{
	bool sw_cq_init = dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_SW_CQ_INIT;
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_cq_table *cq_table = &priv->cq_table;
	struct mlx4_cmd_mailbox *mailbox;
	struct mlx4_cq_context *cq_context;
	u64 mtt_addr;
	int err;

	if (vector >= dev->caps.num_comp_vectors)
		return -EINVAL;

	cq->vector = vector;

	err = mlx4_cq_alloc_icm(dev, &cq->cqn, cq->usage);
	if (err)
		return err;

	spin_lock(&cq_table->lock);
	err = radix_tree_insert(&cq_table->tree, cq->cqn, cq);
	spin_unlock(&cq_table->lock);
	if (err)
		goto err_icm;

	mailbox = mlx4_alloc_cmd_mailbox(dev);
	if (IS_ERR(mailbox)) {
		err = PTR_ERR(mailbox);
		goto err_radix;
	}

	cq_context = mailbox->buf;
	cq_context->flags = cpu_to_be32(!!collapsed << 18);
	if (timestamp_en)
		cq_context->flags |= cpu_to_be32(1 << 19);

	cq_context->logsize_usrpage =
		cpu_to_be32((ilog2(nent) << 24) |
			    mlx4_to_hw_uar_index(dev, uar->index));
	cq_context->comp_eqn = priv->eq_table.eq[MLX4_CQ_TO_EQ_VECTOR(vector)].eqn;
	cq_context->log_page_size = mtt->page_shift - MLX4_ICM_PAGE_SHIFT;

	mtt_addr = mlx4_mtt_addr(dev, mtt);
	cq_context->mtt_base_addr_h = mtt_addr >> 32;
	cq_context->mtt_base_addr_l = cpu_to_be32(mtt_addr & 0xffffffff);
	cq_context->db_rec_addr = cpu_to_be64(db_rec);

	if (sw_cq_init) {
		if (user_cq) {
			err = mlx4_init_user_cqes(buf_addr, nent,
						  dev->caps.cqe_size);
			if (err)
				sw_cq_init = false;
		} else {
			mlx4_init_kernel_cqes(buf_addr, nent,
					      dev->caps.cqe_size);
		}
	}

	err = mlx4_SW2HW_CQ(dev, mailbox, cq->cqn, sw_cq_init);

	mlx4_free_cmd_mailbox(dev, mailbox);
	if (err)
		goto err_radix;

	cq->cons_index = 0;
	cq->arm_sn = 1;
	cq->uar = uar;
	refcount_set(&cq->refcount, 1);
	init_completion(&cq->free);
	cq->comp = mlx4_add_cq_to_tasklet;
	cq->tasklet_ctx.priv =
		&priv->eq_table.eq[MLX4_CQ_TO_EQ_VECTOR(vector)].tasklet_ctx;
	INIT_LIST_HEAD(&cq->tasklet_ctx.list);

	cq->irq = priv->eq_table.eq[MLX4_CQ_TO_EQ_VECTOR(vector)].irq;
	return 0;

err_radix:
	spin_lock(&cq_table->lock);
	radix_tree_delete(&cq_table->tree, cq->cqn);
	spin_unlock(&cq_table->lock);

err_icm:
	mlx4_cq_free_icm(dev, cq->cqn);

	return err;
}
EXPORT_SYMBOL_GPL(mlx4_cq_alloc);

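/* Tear down a CQ: move it back to software ownership, unpublish it
 * from the radix tree, then synchronize against the completion and
 * async IRQs and wait for the reference count to drop to zero, so no
 * handler can still be running when the ICM backing it is released.
 */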
void mlx4_cq_free(struct mlx4_dev *dev, struct mlx4_cq *cq)
{
	struct mlx4_priv *priv = mlx4_priv(dev);
	struct mlx4_cq_table *cq_table = &priv->cq_table;
	int err;

	err = mlx4_HW2SW_CQ(dev, NULL, cq->cqn);
	if (err)
		mlx4_warn(dev, "HW2SW_CQ failed (%d) for CQN %06x\n", err, cq->cqn);

	spin_lock(&cq_table->lock);
	radix_tree_delete(&cq_table->tree, cq->cqn);
	spin_unlock(&cq_table->lock);

	synchronize_irq(priv->eq_table.eq[MLX4_CQ_TO_EQ_VECTOR(cq->vector)].irq);
	if (priv->eq_table.eq[MLX4_CQ_TO_EQ_VECTOR(cq->vector)].irq !=
	    priv->eq_table.eq[MLX4_EQ_ASYNC].irq)
		synchronize_irq(priv->eq_table.eq[MLX4_EQ_ASYNC].irq);

	if (refcount_dec_and_test(&cq->refcount))
		complete(&cq->free);
	wait_for_completion(&cq->free);

	mlx4_cq_free_icm(dev, cq->cqn);
}
EXPORT_SYMBOL_GPL(mlx4_cq_free);

int mlx4_init_cq_table(struct mlx4_dev *dev)
{
	struct mlx4_cq_table *cq_table = &mlx4_priv(dev)->cq_table;

	spin_lock_init(&cq_table->lock);
	INIT_RADIX_TREE(&cq_table->tree, GFP_ATOMIC);
	if (mlx4_is_slave(dev))
		return 0;

	return mlx4_bitmap_init(&cq_table->bitmap, dev->caps.num_cqs,
				dev->caps.num_cqs - 1, dev->caps.reserved_cqs, 0);
}

void mlx4_cleanup_cq_table(struct mlx4_dev *dev)
{
	if (mlx4_is_slave(dev))
		return;
	/* Nothing to do to clean up radix_tree */
	mlx4_bitmap_cleanup(&mlx4_priv(dev)->cq_table.bitmap);
}
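
/* Usage sketch (illustrative only; "dev", "mtt", "uar", "db_dma",
 * "buf", "vec" and "nent" are hypothetical locals, not part of this
 * file). A kernel consumer pairs the two exported entry points
 * roughly as follows, re-arming with mlx4_cq_arm() from
 * <linux/mlx4/cq.h> after polling:
 *
 *	struct mlx4_cq cq = { .usage = MLX4_RES_USAGE_DRIVER };
 *	int err;
 *
 *	err = mlx4_cq_alloc(dev, nent, mtt, uar, db_dma, &cq, vec,
 *			    0, 0, buf, false);
 *	if (err)
 *		return err;
 *	... poll CQEs, mlx4_cq_arm(), and eventually: ...
 *	mlx4_cq_free(dev, &cq);
 */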