| /* |
| * Copyright (c) 2004 Topspin Communications. All rights reserved. |
| * Copyright (c) 2005 Mellanox Technologies. All rights reserved. |
| * |
| * This software is available to you under a choice of one of two |
| * licenses. You may choose to be licensed under the terms of the GNU |
| * General Public License (GPL) Version 2, available from the file |
| * COPYING in the main directory of this source tree, or the |
| * OpenIB.org BSD license below: |
| * |
| * Redistribution and use in source and binary forms, with or |
| * without modification, are permitted provided that the following |
| * conditions are met: |
| * |
| * - Redistributions of source code must retain the above |
| * copyright notice, this list of conditions and the following |
| * disclaimer. |
| * |
| * - Redistributions in binary form must reproduce the above |
| * copyright notice, this list of conditions and the following |
| * disclaimer in the documentation and/or other materials |
| * provided with the distribution. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, |
| * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
| * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND |
| * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS |
| * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN |
| * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN |
| * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| * SOFTWARE. |
| */ |
| |
| #include <linux/slab.h> |
| #include <linux/errno.h> |
| |
| #include "mthca_dev.h" |
| #include "mthca_cmd.h" |
| #include "mthca_memfree.h" |
| |
| struct mthca_mtt { |
| struct mthca_buddy *buddy; |
| int order; |
| u32 first_seg; |
| }; |
| |
| /* |
| * Must be packed because mtt_seg is 64 bits but only aligned to 32 bits. |
| */ |
| struct mthca_mpt_entry { |
| __be32 flags; |
| __be32 page_size; |
| __be32 key; |
| __be32 pd; |
| __be64 start; |
| __be64 length; |
| __be32 lkey; |
| __be32 window_count; |
| __be32 window_count_limit; |
| __be64 mtt_seg; |
| __be32 mtt_sz; /* Arbel only */ |
| u32 reserved[2]; |
| } __attribute__((packed)); |
| |
/* Bits OR'ed into the flags word of an MPT entry. */
#define MTHCA_MPT_FLAG_SW_OWNS       (0xfUL << 28)
#define MTHCA_MPT_FLAG_MIO           (1 << 17)
#define MTHCA_MPT_FLAG_BIND_ENABLE   (1 << 15)
#define MTHCA_MPT_FLAG_PHYSICAL      (1 <<  9)	/* set when the region has no MTT */
#define MTHCA_MPT_FLAG_REGION        (1 <<  8)

/* OR'ed into every MTT entry written by this file. */
#define MTHCA_MTT_FLAG_PRESENT       1

/* Values stored in the first byte of an FMR's MPT entry on map/unmap. */
#define MTHCA_MPT_STATUS_SW     0xF0
#define MTHCA_MPT_STATUS_HW     0x00

/* Added to the key on each Arbel FMR mapping when MTHCA_FLAG_SINAI_OPT is set. */
#define SINAI_FMR_KEY_INC 0x1000000
| |
| /* |
| * Buddy allocator for MTT segments (currently not very efficient |
| * since it doesn't keep a free list and just searches linearly |
| * through the bitmaps) |
| */ |
| |
| static u32 mthca_buddy_alloc(struct mthca_buddy *buddy, int order) |
| { |
| int o; |
| int m; |
| u32 seg; |
| |
| spin_lock(&buddy->lock); |
| |
| for (o = order; o <= buddy->max_order; ++o) |
| if (buddy->num_free[o]) { |
| m = 1 << (buddy->max_order - o); |
| seg = find_first_bit(buddy->bits[o], m); |
| if (seg < m) |
| goto found; |
| } |
| |
| spin_unlock(&buddy->lock); |
| return -1; |
| |
| found: |
| clear_bit(seg, buddy->bits[o]); |
| --buddy->num_free[o]; |
| |
| while (o > order) { |
| --o; |
| seg <<= 1; |
| set_bit(seg ^ 1, buddy->bits[o]); |
| ++buddy->num_free[o]; |
| } |
| |
| spin_unlock(&buddy->lock); |
| |
| seg <<= order; |
| |
| return seg; |
| } |
| |
| static void mthca_buddy_free(struct mthca_buddy *buddy, u32 seg, int order) |
| { |
| seg >>= order; |
| |
| spin_lock(&buddy->lock); |
| |
| while (test_bit(seg ^ 1, buddy->bits[order])) { |
| clear_bit(seg ^ 1, buddy->bits[order]); |
| --buddy->num_free[order]; |
| seg >>= 1; |
| ++order; |
| } |
| |
| set_bit(seg, buddy->bits[order]); |
| ++buddy->num_free[order]; |
| |
| spin_unlock(&buddy->lock); |
| } |
| |
| static int mthca_buddy_init(struct mthca_buddy *buddy, int max_order) |
| { |
| int i, s; |
| |
| buddy->max_order = max_order; |
| spin_lock_init(&buddy->lock); |
| |
| buddy->bits = kzalloc((buddy->max_order + 1) * sizeof (long *), |
| GFP_KERNEL); |
| buddy->num_free = kcalloc((buddy->max_order + 1), sizeof *buddy->num_free, |
| GFP_KERNEL); |
| if (!buddy->bits || !buddy->num_free) |
| goto err_out; |
| |
| for (i = 0; i <= buddy->max_order; ++i) { |
| s = BITS_TO_LONGS(1 << (buddy->max_order - i)); |
| buddy->bits[i] = kmalloc_array(s, sizeof(long), GFP_KERNEL); |
| if (!buddy->bits[i]) |
| goto err_out_free; |
| bitmap_zero(buddy->bits[i], |
| 1 << (buddy->max_order - i)); |
| } |
| |
| set_bit(0, buddy->bits[buddy->max_order]); |
| buddy->num_free[buddy->max_order] = 1; |
| |
| return 0; |
| |
| err_out_free: |
| for (i = 0; i <= buddy->max_order; ++i) |
| kfree(buddy->bits[i]); |
| |
| err_out: |
| kfree(buddy->bits); |
| kfree(buddy->num_free); |
| |
| return -ENOMEM; |
| } |
| |
| static void mthca_buddy_cleanup(struct mthca_buddy *buddy) |
| { |
| int i; |
| |
| for (i = 0; i <= buddy->max_order; ++i) |
| kfree(buddy->bits[i]); |
| |
| kfree(buddy->bits); |
| kfree(buddy->num_free); |
| } |
| |
| static u32 mthca_alloc_mtt_range(struct mthca_dev *dev, int order, |
| struct mthca_buddy *buddy) |
| { |
| u32 seg = mthca_buddy_alloc(buddy, order); |
| |
| if (seg == -1) |
| return -1; |
| |
| if (mthca_is_memfree(dev)) |
| if (mthca_table_get_range(dev, dev->mr_table.mtt_table, seg, |
| seg + (1 << order) - 1)) { |
| mthca_buddy_free(buddy, seg, order); |
| seg = -1; |
| } |
| |
| return seg; |
| } |
| |
| static struct mthca_mtt *__mthca_alloc_mtt(struct mthca_dev *dev, int size, |
| struct mthca_buddy *buddy) |
| { |
| struct mthca_mtt *mtt; |
| int i; |
| |
| if (size <= 0) |
| return ERR_PTR(-EINVAL); |
| |
| mtt = kmalloc(sizeof *mtt, GFP_KERNEL); |
| if (!mtt) |
| return ERR_PTR(-ENOMEM); |
| |
| mtt->buddy = buddy; |
| mtt->order = 0; |
| for (i = dev->limits.mtt_seg_size / 8; i < size; i <<= 1) |
| ++mtt->order; |
| |
| mtt->first_seg = mthca_alloc_mtt_range(dev, mtt->order, buddy); |
| if (mtt->first_seg == -1) { |
| kfree(mtt); |
| return ERR_PTR(-ENOMEM); |
| } |
| |
| return mtt; |
| } |
| |
| struct mthca_mtt *mthca_alloc_mtt(struct mthca_dev *dev, int size) |
| { |
| return __mthca_alloc_mtt(dev, size, &dev->mr_table.mtt_buddy); |
| } |
| |
| void mthca_free_mtt(struct mthca_dev *dev, struct mthca_mtt *mtt) |
| { |
| if (!mtt) |
| return; |
| |
| mthca_buddy_free(mtt->buddy, mtt->first_seg, mtt->order); |
| |
| mthca_table_put_range(dev, dev->mr_table.mtt_table, |
| mtt->first_seg, |
| mtt->first_seg + (1 << mtt->order) - 1); |
| |
| kfree(mtt); |
| } |
| |
| static int __mthca_write_mtt(struct mthca_dev *dev, struct mthca_mtt *mtt, |
| int start_index, u64 *buffer_list, int list_len) |
| { |
| struct mthca_mailbox *mailbox; |
| __be64 *mtt_entry; |
| int err = 0; |
| int i; |
| |
| mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); |
| if (IS_ERR(mailbox)) |
| return PTR_ERR(mailbox); |
| mtt_entry = mailbox->buf; |
| |
| while (list_len > 0) { |
| mtt_entry[0] = cpu_to_be64(dev->mr_table.mtt_base + |
| mtt->first_seg * dev->limits.mtt_seg_size + |
| start_index * 8); |
| mtt_entry[1] = 0; |
| for (i = 0; i < list_len && i < MTHCA_MAILBOX_SIZE / 8 - 2; ++i) |
| mtt_entry[i + 2] = cpu_to_be64(buffer_list[i] | |
| MTHCA_MTT_FLAG_PRESENT); |
| |
| /* |
| * If we have an odd number of entries to write, add |
| * one more dummy entry for firmware efficiency. |
| */ |
| if (i & 1) |
| mtt_entry[i + 2] = 0; |
| |
| err = mthca_WRITE_MTT(dev, mailbox, (i + 1) & ~1); |
| if (err) { |
| mthca_warn(dev, "WRITE_MTT failed (%d)\n", err); |
| goto out; |
| } |
| |
| list_len -= i; |
| start_index += i; |
| buffer_list += i; |
| } |
| |
| out: |
| mthca_free_mailbox(dev, mailbox); |
| return err; |
| } |
| |
| int mthca_write_mtt_size(struct mthca_dev *dev) |
| { |
| if (dev->mr_table.fmr_mtt_buddy != &dev->mr_table.mtt_buddy || |
| !(dev->mthca_flags & MTHCA_FLAG_FMR)) |
| /* |
| * Be friendly to WRITE_MTT command |
| * and leave two empty slots for the |
| * index and reserved fields of the |
| * mailbox. |
| */ |
| return PAGE_SIZE / sizeof (u64) - 2; |
| |
| /* For Arbel, all MTTs must fit in the same page. */ |
| return mthca_is_memfree(dev) ? (PAGE_SIZE / sizeof (u64)) : 0x7ffffff; |
| } |
| |
| static void mthca_tavor_write_mtt_seg(struct mthca_dev *dev, |
| struct mthca_mtt *mtt, int start_index, |
| u64 *buffer_list, int list_len) |
| { |
| u64 __iomem *mtts; |
| int i; |
| |
| mtts = dev->mr_table.tavor_fmr.mtt_base + mtt->first_seg * dev->limits.mtt_seg_size + |
| start_index * sizeof (u64); |
| for (i = 0; i < list_len; ++i) |
| mthca_write64_raw(cpu_to_be64(buffer_list[i] | MTHCA_MTT_FLAG_PRESENT), |
| mtts + i); |
| } |
| |
| static void mthca_arbel_write_mtt_seg(struct mthca_dev *dev, |
| struct mthca_mtt *mtt, int start_index, |
| u64 *buffer_list, int list_len) |
| { |
| __be64 *mtts; |
| dma_addr_t dma_handle; |
| int i; |
| int s = start_index * sizeof (u64); |
| |
| /* For Arbel, all MTTs must fit in the same page. */ |
| BUG_ON(s / PAGE_SIZE != (s + list_len * sizeof(u64) - 1) / PAGE_SIZE); |
| /* Require full segments */ |
| BUG_ON(s % dev->limits.mtt_seg_size); |
| |
| mtts = mthca_table_find(dev->mr_table.mtt_table, mtt->first_seg + |
| s / dev->limits.mtt_seg_size, &dma_handle); |
| |
| BUG_ON(!mtts); |
| |
| dma_sync_single_for_cpu(&dev->pdev->dev, dma_handle, |
| list_len * sizeof (u64), DMA_TO_DEVICE); |
| |
| for (i = 0; i < list_len; ++i) |
| mtts[i] = cpu_to_be64(buffer_list[i] | MTHCA_MTT_FLAG_PRESENT); |
| |
| dma_sync_single_for_device(&dev->pdev->dev, dma_handle, |
| list_len * sizeof (u64), DMA_TO_DEVICE); |
| } |
| |
| int mthca_write_mtt(struct mthca_dev *dev, struct mthca_mtt *mtt, |
| int start_index, u64 *buffer_list, int list_len) |
| { |
| int size = mthca_write_mtt_size(dev); |
| int chunk; |
| |
| if (dev->mr_table.fmr_mtt_buddy != &dev->mr_table.mtt_buddy || |
| !(dev->mthca_flags & MTHCA_FLAG_FMR)) |
| return __mthca_write_mtt(dev, mtt, start_index, buffer_list, list_len); |
| |
| while (list_len > 0) { |
| chunk = min(size, list_len); |
| if (mthca_is_memfree(dev)) |
| mthca_arbel_write_mtt_seg(dev, mtt, start_index, |
| buffer_list, chunk); |
| else |
| mthca_tavor_write_mtt_seg(dev, mtt, start_index, |
| buffer_list, chunk); |
| |
| list_len -= chunk; |
| start_index += chunk; |
| buffer_list += chunk; |
| } |
| |
| return 0; |
| } |
| |
| static inline u32 tavor_hw_index_to_key(u32 ind) |
| { |
| return ind; |
| } |
| |
| static inline u32 tavor_key_to_hw_index(u32 key) |
| { |
| return key; |
| } |
| |
| static inline u32 arbel_hw_index_to_key(u32 ind) |
| { |
| return (ind >> 24) | (ind << 8); |
| } |
| |
| static inline u32 arbel_key_to_hw_index(u32 key) |
| { |
| return (key << 24) | (key >> 8); |
| } |
| |
| static inline u32 hw_index_to_key(struct mthca_dev *dev, u32 ind) |
| { |
| if (mthca_is_memfree(dev)) |
| return arbel_hw_index_to_key(ind); |
| else |
| return tavor_hw_index_to_key(ind); |
| } |
| |
| static inline u32 key_to_hw_index(struct mthca_dev *dev, u32 key) |
| { |
| if (mthca_is_memfree(dev)) |
| return arbel_key_to_hw_index(key); |
| else |
| return tavor_key_to_hw_index(key); |
| } |
| |
| static inline u32 adjust_key(struct mthca_dev *dev, u32 key) |
| { |
| if (dev->mthca_flags & MTHCA_FLAG_SINAI_OPT) |
| return ((key << 20) & 0x800000) | (key & 0x7fffff); |
| else |
| return key; |
| } |
| |
| int mthca_mr_alloc(struct mthca_dev *dev, u32 pd, int buffer_size_shift, |
| u64 iova, u64 total_size, u32 access, struct mthca_mr *mr) |
| { |
| struct mthca_mailbox *mailbox; |
| struct mthca_mpt_entry *mpt_entry; |
| u32 key; |
| int i; |
| int err; |
| |
| WARN_ON(buffer_size_shift >= 32); |
| |
| key = mthca_alloc(&dev->mr_table.mpt_alloc); |
| if (key == -1) |
| return -ENOMEM; |
| key = adjust_key(dev, key); |
| mr->ibmr.rkey = mr->ibmr.lkey = hw_index_to_key(dev, key); |
| |
| if (mthca_is_memfree(dev)) { |
| err = mthca_table_get(dev, dev->mr_table.mpt_table, key); |
| if (err) |
| goto err_out_mpt_free; |
| } |
| |
| mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); |
| if (IS_ERR(mailbox)) { |
| err = PTR_ERR(mailbox); |
| goto err_out_table; |
| } |
| mpt_entry = mailbox->buf; |
| |
| mpt_entry->flags = cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS | |
| MTHCA_MPT_FLAG_MIO | |
| MTHCA_MPT_FLAG_REGION | |
| access); |
| if (!mr->mtt) |
| mpt_entry->flags |= cpu_to_be32(MTHCA_MPT_FLAG_PHYSICAL); |
| |
| mpt_entry->page_size = cpu_to_be32(buffer_size_shift - 12); |
| mpt_entry->key = cpu_to_be32(key); |
| mpt_entry->pd = cpu_to_be32(pd); |
| mpt_entry->start = cpu_to_be64(iova); |
| mpt_entry->length = cpu_to_be64(total_size); |
| |
| memset(&mpt_entry->lkey, 0, |
| sizeof *mpt_entry - offsetof(struct mthca_mpt_entry, lkey)); |
| |
| if (mr->mtt) |
| mpt_entry->mtt_seg = |
| cpu_to_be64(dev->mr_table.mtt_base + |
| mr->mtt->first_seg * dev->limits.mtt_seg_size); |
| |
| if (0) { |
| mthca_dbg(dev, "Dumping MPT entry %08x:\n", mr->ibmr.lkey); |
| for (i = 0; i < sizeof (struct mthca_mpt_entry) / 4; ++i) { |
| if (i % 4 == 0) |
| printk("[%02x] ", i * 4); |
| printk(" %08x", be32_to_cpu(((__be32 *) mpt_entry)[i])); |
| if ((i + 1) % 4 == 0) |
| printk("\n"); |
| } |
| } |
| |
| err = mthca_SW2HW_MPT(dev, mailbox, |
| key & (dev->limits.num_mpts - 1)); |
| if (err) { |
| mthca_warn(dev, "SW2HW_MPT failed (%d)\n", err); |
| goto err_out_mailbox; |
| } |
| |
| mthca_free_mailbox(dev, mailbox); |
| return err; |
| |
| err_out_mailbox: |
| mthca_free_mailbox(dev, mailbox); |
| |
| err_out_table: |
| mthca_table_put(dev, dev->mr_table.mpt_table, key); |
| |
| err_out_mpt_free: |
| mthca_free(&dev->mr_table.mpt_alloc, key); |
| return err; |
| } |
| |
| int mthca_mr_alloc_notrans(struct mthca_dev *dev, u32 pd, |
| u32 access, struct mthca_mr *mr) |
| { |
| mr->mtt = NULL; |
| return mthca_mr_alloc(dev, pd, 12, 0, ~0ULL, access, mr); |
| } |
| |
| int mthca_mr_alloc_phys(struct mthca_dev *dev, u32 pd, |
| u64 *buffer_list, int buffer_size_shift, |
| int list_len, u64 iova, u64 total_size, |
| u32 access, struct mthca_mr *mr) |
| { |
| int err; |
| |
| mr->mtt = mthca_alloc_mtt(dev, list_len); |
| if (IS_ERR(mr->mtt)) |
| return PTR_ERR(mr->mtt); |
| |
| err = mthca_write_mtt(dev, mr->mtt, 0, buffer_list, list_len); |
| if (err) { |
| mthca_free_mtt(dev, mr->mtt); |
| return err; |
| } |
| |
| err = mthca_mr_alloc(dev, pd, buffer_size_shift, iova, |
| total_size, access, mr); |
| if (err) |
| mthca_free_mtt(dev, mr->mtt); |
| |
| return err; |
| } |
| |
| /* Free mr or fmr */ |
| static void mthca_free_region(struct mthca_dev *dev, u32 lkey) |
| { |
| mthca_table_put(dev, dev->mr_table.mpt_table, |
| key_to_hw_index(dev, lkey)); |
| |
| mthca_free(&dev->mr_table.mpt_alloc, key_to_hw_index(dev, lkey)); |
| } |
| |
| void mthca_free_mr(struct mthca_dev *dev, struct mthca_mr *mr) |
| { |
| int err; |
| |
| err = mthca_HW2SW_MPT(dev, NULL, |
| key_to_hw_index(dev, mr->ibmr.lkey) & |
| (dev->limits.num_mpts - 1)); |
| if (err) |
| mthca_warn(dev, "HW2SW_MPT failed (%d)\n", err); |
| |
| mthca_free_region(dev, mr->ibmr.lkey); |
| mthca_free_mtt(dev, mr->mtt); |
| } |
| |
| int mthca_fmr_alloc(struct mthca_dev *dev, u32 pd, |
| u32 access, struct mthca_fmr *mr) |
| { |
| struct mthca_mpt_entry *mpt_entry; |
| struct mthca_mailbox *mailbox; |
| u64 mtt_seg; |
| u32 key, idx; |
| int list_len = mr->attr.max_pages; |
| int err = -ENOMEM; |
| int i; |
| |
| if (mr->attr.page_shift < 12 || mr->attr.page_shift >= 32) |
| return -EINVAL; |
| |
| /* For Arbel, all MTTs must fit in the same page. */ |
| if (mthca_is_memfree(dev) && |
| mr->attr.max_pages * sizeof *mr->mem.arbel.mtts > PAGE_SIZE) |
| return -EINVAL; |
| |
| mr->maps = 0; |
| |
| key = mthca_alloc(&dev->mr_table.mpt_alloc); |
| if (key == -1) |
| return -ENOMEM; |
| key = adjust_key(dev, key); |
| |
| idx = key & (dev->limits.num_mpts - 1); |
| mr->ibmr.rkey = mr->ibmr.lkey = hw_index_to_key(dev, key); |
| |
| if (mthca_is_memfree(dev)) { |
| err = mthca_table_get(dev, dev->mr_table.mpt_table, key); |
| if (err) |
| goto err_out_mpt_free; |
| |
| mr->mem.arbel.mpt = mthca_table_find(dev->mr_table.mpt_table, key, NULL); |
| BUG_ON(!mr->mem.arbel.mpt); |
| } else |
| mr->mem.tavor.mpt = dev->mr_table.tavor_fmr.mpt_base + |
| sizeof *(mr->mem.tavor.mpt) * idx; |
| |
| mr->mtt = __mthca_alloc_mtt(dev, list_len, dev->mr_table.fmr_mtt_buddy); |
| if (IS_ERR(mr->mtt)) { |
| err = PTR_ERR(mr->mtt); |
| goto err_out_table; |
| } |
| |
| mtt_seg = mr->mtt->first_seg * dev->limits.mtt_seg_size; |
| |
| if (mthca_is_memfree(dev)) { |
| mr->mem.arbel.mtts = mthca_table_find(dev->mr_table.mtt_table, |
| mr->mtt->first_seg, |
| &mr->mem.arbel.dma_handle); |
| BUG_ON(!mr->mem.arbel.mtts); |
| } else |
| mr->mem.tavor.mtts = dev->mr_table.tavor_fmr.mtt_base + mtt_seg; |
| |
| mailbox = mthca_alloc_mailbox(dev, GFP_KERNEL); |
| if (IS_ERR(mailbox)) { |
| err = PTR_ERR(mailbox); |
| goto err_out_free_mtt; |
| } |
| |
| mpt_entry = mailbox->buf; |
| |
| mpt_entry->flags = cpu_to_be32(MTHCA_MPT_FLAG_SW_OWNS | |
| MTHCA_MPT_FLAG_MIO | |
| MTHCA_MPT_FLAG_REGION | |
| access); |
| |
| mpt_entry->page_size = cpu_to_be32(mr->attr.page_shift - 12); |
| mpt_entry->key = cpu_to_be32(key); |
| mpt_entry->pd = cpu_to_be32(pd); |
| memset(&mpt_entry->start, 0, |
| sizeof *mpt_entry - offsetof(struct mthca_mpt_entry, start)); |
| mpt_entry->mtt_seg = cpu_to_be64(dev->mr_table.mtt_base + mtt_seg); |
| |
| if (0) { |
| mthca_dbg(dev, "Dumping MPT entry %08x:\n", mr->ibmr.lkey); |
| for (i = 0; i < sizeof (struct mthca_mpt_entry) / 4; ++i) { |
| if (i % 4 == 0) |
| printk("[%02x] ", i * 4); |
| printk(" %08x", be32_to_cpu(((__be32 *) mpt_entry)[i])); |
| if ((i + 1) % 4 == 0) |
| printk("\n"); |
| } |
| } |
| |
| err = mthca_SW2HW_MPT(dev, mailbox, |
| key & (dev->limits.num_mpts - 1)); |
| if (err) { |
| mthca_warn(dev, "SW2HW_MPT failed (%d)\n", err); |
| goto err_out_mailbox_free; |
| } |
| |
| mthca_free_mailbox(dev, mailbox); |
| return 0; |
| |
| err_out_mailbox_free: |
| mthca_free_mailbox(dev, mailbox); |
| |
| err_out_free_mtt: |
| mthca_free_mtt(dev, mr->mtt); |
| |
| err_out_table: |
| mthca_table_put(dev, dev->mr_table.mpt_table, key); |
| |
| err_out_mpt_free: |
| mthca_free(&dev->mr_table.mpt_alloc, key); |
| return err; |
| } |
| |
| int mthca_free_fmr(struct mthca_dev *dev, struct mthca_fmr *fmr) |
| { |
| if (fmr->maps) |
| return -EBUSY; |
| |
| mthca_free_region(dev, fmr->ibmr.lkey); |
| mthca_free_mtt(dev, fmr->mtt); |
| |
| return 0; |
| } |
| |
| static inline int mthca_check_fmr(struct mthca_fmr *fmr, u64 *page_list, |
| int list_len, u64 iova) |
| { |
| int i, page_mask; |
| |
| if (list_len > fmr->attr.max_pages) |
| return -EINVAL; |
| |
| page_mask = (1 << fmr->attr.page_shift) - 1; |
| |
| /* We are getting page lists, so va must be page aligned. */ |
| if (iova & page_mask) |
| return -EINVAL; |
| |
| /* Trust the user not to pass misaligned data in page_list */ |
| if (0) |
| for (i = 0; i < list_len; ++i) { |
| if (page_list[i] & ~page_mask) |
| return -EINVAL; |
| } |
| |
| if (fmr->maps >= fmr->attr.max_maps) |
| return -EINVAL; |
| |
| return 0; |
| } |
| |
| |
| int mthca_tavor_map_phys_fmr(struct ib_fmr *ibfmr, u64 *page_list, |
| int list_len, u64 iova) |
| { |
| struct mthca_fmr *fmr = to_mfmr(ibfmr); |
| struct mthca_dev *dev = to_mdev(ibfmr->device); |
| struct mthca_mpt_entry mpt_entry; |
| u32 key; |
| int i, err; |
| |
| err = mthca_check_fmr(fmr, page_list, list_len, iova); |
| if (err) |
| return err; |
| |
| ++fmr->maps; |
| |
| key = tavor_key_to_hw_index(fmr->ibmr.lkey); |
| key += dev->limits.num_mpts; |
| fmr->ibmr.lkey = fmr->ibmr.rkey = tavor_hw_index_to_key(key); |
| |
| writeb(MTHCA_MPT_STATUS_SW, fmr->mem.tavor.mpt); |
| |
| for (i = 0; i < list_len; ++i) { |
| __be64 mtt_entry = cpu_to_be64(page_list[i] | |
| MTHCA_MTT_FLAG_PRESENT); |
| mthca_write64_raw(mtt_entry, fmr->mem.tavor.mtts + i); |
| } |
| |
| mpt_entry.lkey = cpu_to_be32(key); |
| mpt_entry.length = cpu_to_be64(list_len * (1ull << fmr->attr.page_shift)); |
| mpt_entry.start = cpu_to_be64(iova); |
| |
| __raw_writel((__force u32) mpt_entry.lkey, &fmr->mem.tavor.mpt->key); |
| memcpy_toio(&fmr->mem.tavor.mpt->start, &mpt_entry.start, |
| offsetof(struct mthca_mpt_entry, window_count) - |
| offsetof(struct mthca_mpt_entry, start)); |
| |
| writeb(MTHCA_MPT_STATUS_HW, fmr->mem.tavor.mpt); |
| |
| return 0; |
| } |
| |
| int mthca_arbel_map_phys_fmr(struct ib_fmr *ibfmr, u64 *page_list, |
| int list_len, u64 iova) |
| { |
| struct mthca_fmr *fmr = to_mfmr(ibfmr); |
| struct mthca_dev *dev = to_mdev(ibfmr->device); |
| u32 key; |
| int i, err; |
| |
| err = mthca_check_fmr(fmr, page_list, list_len, iova); |
| if (err) |
| return err; |
| |
| ++fmr->maps; |
| |
| key = arbel_key_to_hw_index(fmr->ibmr.lkey); |
| if (dev->mthca_flags & MTHCA_FLAG_SINAI_OPT) |
| key += SINAI_FMR_KEY_INC; |
| else |
| key += dev->limits.num_mpts; |
| fmr->ibmr.lkey = fmr->ibmr.rkey = arbel_hw_index_to_key(key); |
| |
| *(u8 *) fmr->mem.arbel.mpt = MTHCA_MPT_STATUS_SW; |
| |
| wmb(); |
| |
| dma_sync_single_for_cpu(&dev->pdev->dev, fmr->mem.arbel.dma_handle, |
| list_len * sizeof(u64), DMA_TO_DEVICE); |
| |
| for (i = 0; i < list_len; ++i) |
| fmr->mem.arbel.mtts[i] = cpu_to_be64(page_list[i] | |
| MTHCA_MTT_FLAG_PRESENT); |
| |
| dma_sync_single_for_device(&dev->pdev->dev, fmr->mem.arbel.dma_handle, |
| list_len * sizeof(u64), DMA_TO_DEVICE); |
| |
| fmr->mem.arbel.mpt->key = cpu_to_be32(key); |
| fmr->mem.arbel.mpt->lkey = cpu_to_be32(key); |
| fmr->mem.arbel.mpt->length = cpu_to_be64(list_len * (1ull << fmr->attr.page_shift)); |
| fmr->mem.arbel.mpt->start = cpu_to_be64(iova); |
| |
| wmb(); |
| |
| *(u8 *) fmr->mem.arbel.mpt = MTHCA_MPT_STATUS_HW; |
| |
| wmb(); |
| |
| return 0; |
| } |
| |
| void mthca_tavor_fmr_unmap(struct mthca_dev *dev, struct mthca_fmr *fmr) |
| { |
| if (!fmr->maps) |
| return; |
| |
| fmr->maps = 0; |
| |
| writeb(MTHCA_MPT_STATUS_SW, fmr->mem.tavor.mpt); |
| } |
| |
| void mthca_arbel_fmr_unmap(struct mthca_dev *dev, struct mthca_fmr *fmr) |
| { |
| if (!fmr->maps) |
| return; |
| |
| fmr->maps = 0; |
| |
| *(u8 *) fmr->mem.arbel.mpt = MTHCA_MPT_STATUS_SW; |
| } |
| |
| int mthca_init_mr_table(struct mthca_dev *dev) |
| { |
| phys_addr_t addr; |
| int mpts, mtts, err, i; |
| |
| err = mthca_alloc_init(&dev->mr_table.mpt_alloc, |
| dev->limits.num_mpts, |
| ~0, dev->limits.reserved_mrws); |
| if (err) |
| return err; |
| |
| if (!mthca_is_memfree(dev) && |
| (dev->mthca_flags & MTHCA_FLAG_DDR_HIDDEN)) |
| dev->limits.fmr_reserved_mtts = 0; |
| else |
| dev->mthca_flags |= MTHCA_FLAG_FMR; |
| |
| if (dev->mthca_flags & MTHCA_FLAG_SINAI_OPT) |
| mthca_dbg(dev, "Memory key throughput optimization activated.\n"); |
| |
| err = mthca_buddy_init(&dev->mr_table.mtt_buddy, |
| fls(dev->limits.num_mtt_segs - 1)); |
| |
| if (err) |
| goto err_mtt_buddy; |
| |
| dev->mr_table.tavor_fmr.mpt_base = NULL; |
| dev->mr_table.tavor_fmr.mtt_base = NULL; |
| |
| if (dev->limits.fmr_reserved_mtts) { |
| i = fls(dev->limits.fmr_reserved_mtts - 1); |
| |
| if (i >= 31) { |
| mthca_warn(dev, "Unable to reserve 2^31 FMR MTTs.\n"); |
| err = -EINVAL; |
| goto err_fmr_mpt; |
| } |
| mpts = mtts = 1 << i; |
| } else { |
| mtts = dev->limits.num_mtt_segs; |
| mpts = dev->limits.num_mpts; |
| } |
| |
| if (!mthca_is_memfree(dev) && |
| (dev->mthca_flags & MTHCA_FLAG_FMR)) { |
| |
| addr = pci_resource_start(dev->pdev, 4) + |
| ((pci_resource_len(dev->pdev, 4) - 1) & |
| dev->mr_table.mpt_base); |
| |
| dev->mr_table.tavor_fmr.mpt_base = |
| ioremap(addr, mpts * sizeof(struct mthca_mpt_entry)); |
| |
| if (!dev->mr_table.tavor_fmr.mpt_base) { |
| mthca_warn(dev, "MPT ioremap for FMR failed.\n"); |
| err = -ENOMEM; |
| goto err_fmr_mpt; |
| } |
| |
| addr = pci_resource_start(dev->pdev, 4) + |
| ((pci_resource_len(dev->pdev, 4) - 1) & |
| dev->mr_table.mtt_base); |
| |
| dev->mr_table.tavor_fmr.mtt_base = |
| ioremap(addr, mtts * dev->limits.mtt_seg_size); |
| if (!dev->mr_table.tavor_fmr.mtt_base) { |
| mthca_warn(dev, "MTT ioremap for FMR failed.\n"); |
| err = -ENOMEM; |
| goto err_fmr_mtt; |
| } |
| } |
| |
| if (dev->limits.fmr_reserved_mtts) { |
| err = mthca_buddy_init(&dev->mr_table.tavor_fmr.mtt_buddy, fls(mtts - 1)); |
| if (err) |
| goto err_fmr_mtt_buddy; |
| |
| /* Prevent regular MRs from using FMR keys */ |
| err = mthca_buddy_alloc(&dev->mr_table.mtt_buddy, fls(mtts - 1)); |
| if (err) |
| goto err_reserve_fmr; |
| |
| dev->mr_table.fmr_mtt_buddy = |
| &dev->mr_table.tavor_fmr.mtt_buddy; |
| } else |
| dev->mr_table.fmr_mtt_buddy = &dev->mr_table.mtt_buddy; |
| |
| /* FMR table is always the first, take reserved MTTs out of there */ |
| if (dev->limits.reserved_mtts) { |
| i = fls(dev->limits.reserved_mtts - 1); |
| |
| if (mthca_alloc_mtt_range(dev, i, |
| dev->mr_table.fmr_mtt_buddy) == -1) { |
| mthca_warn(dev, "MTT table of order %d is too small.\n", |
| dev->mr_table.fmr_mtt_buddy->max_order); |
| err = -ENOMEM; |
| goto err_reserve_mtts; |
| } |
| } |
| |
| return 0; |
| |
| err_reserve_mtts: |
| err_reserve_fmr: |
| if (dev->limits.fmr_reserved_mtts) |
| mthca_buddy_cleanup(&dev->mr_table.tavor_fmr.mtt_buddy); |
| |
| err_fmr_mtt_buddy: |
| if (dev->mr_table.tavor_fmr.mtt_base) |
| iounmap(dev->mr_table.tavor_fmr.mtt_base); |
| |
| err_fmr_mtt: |
| if (dev->mr_table.tavor_fmr.mpt_base) |
| iounmap(dev->mr_table.tavor_fmr.mpt_base); |
| |
| err_fmr_mpt: |
| mthca_buddy_cleanup(&dev->mr_table.mtt_buddy); |
| |
| err_mtt_buddy: |
| mthca_alloc_cleanup(&dev->mr_table.mpt_alloc); |
| |
| return err; |
| } |
| |
| void mthca_cleanup_mr_table(struct mthca_dev *dev) |
| { |
| /* XXX check if any MRs are still allocated? */ |
| if (dev->limits.fmr_reserved_mtts) |
| mthca_buddy_cleanup(&dev->mr_table.tavor_fmr.mtt_buddy); |
| |
| mthca_buddy_cleanup(&dev->mr_table.mtt_buddy); |
| |
| if (dev->mr_table.tavor_fmr.mtt_base) |
| iounmap(dev->mr_table.tavor_fmr.mtt_base); |
| if (dev->mr_table.tavor_fmr.mpt_base) |
| iounmap(dev->mr_table.tavor_fmr.mpt_base); |
| |
| mthca_alloc_cleanup(&dev->mr_table.mpt_alloc); |
| } |