lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20200417201749.GF3083@unreal>
Date:   Fri, 17 Apr 2020 23:17:49 +0300
From:   Leon Romanovsky <leon@...nel.org>
To:     Jeff Kirsher <jeffrey.t.kirsher@...el.com>
Cc:     gregkh@...uxfoundation.org, jgg@...pe.ca,
        Mustafa Ismail <mustafa.ismail@...el.com>,
        netdev@...r.kernel.org, linux-rdma@...r.kernel.org,
        nhorman@...hat.com, sassmann@...hat.com,
        Shiraz Saleem <shiraz.saleem@...el.com>
Subject: Re: [RFC PATCH v5 04/16] RDMA/irdma: Add HMC backing store setup
 functions

On Fri, Apr 17, 2020 at 10:12:39AM -0700, Jeff Kirsher wrote:
> From: Mustafa Ismail <mustafa.ismail@...el.com>
>
> HW uses host memory as a backing store for a number of
> protocol context objects and queue state tracking.
> The Host Memory Cache (HMC) is a component responsible for
> managing these objects stored in host memory.
>
> Add the functions and data structures to manage the allocation
> of backing pages used by the HMC for the various objects
>
> Signed-off-by: Mustafa Ismail <mustafa.ismail@...el.com>
> Signed-off-by: Shiraz Saleem <shiraz.saleem@...el.com>
> ---
>  drivers/infiniband/hw/irdma/hmc.c | 705 ++++++++++++++++++++++++++++++
>  drivers/infiniband/hw/irdma/hmc.h | 217 +++++++++
>  2 files changed, 922 insertions(+)
>  create mode 100644 drivers/infiniband/hw/irdma/hmc.c
>  create mode 100644 drivers/infiniband/hw/irdma/hmc.h
>
> diff --git a/drivers/infiniband/hw/irdma/hmc.c b/drivers/infiniband/hw/irdma/hmc.c
> new file mode 100644
> index 000000000000..a5928030947c
> --- /dev/null
> +++ b/drivers/infiniband/hw/irdma/hmc.c
> @@ -0,0 +1,705 @@
> +// SPDX-License-Identifier: GPL-2.0 or Linux-OpenIB
> +/* Copyright (c) 2015 - 2019 Intel Corporation */
> +#include "osdep.h"
> +#include "status.h"
> +#include "hmc.h"
> +#include "defs.h"
> +#include "type.h"
> +#include "protos.h"
> +
> +/**
> + * irdma_find_sd_index_limit - finds segment descriptor index limit
> + * @hmc_info: pointer to the HMC configuration information structure
> + * @type: type of HMC resources we're searching
> + * @idx: starting index for the object
> + * @cnt: number of objects we're trying to create
> + * @sd_idx: pointer to return index of the segment descriptor in question
> + * @sd_limit: pointer to return the maximum number of segment descriptors
> + *
> + * This function calculates the segment descriptor index and index limit
> + * for the resource defined by irdma_hmc_rsrc_type.
> + */
> +
> +static void irdma_find_sd_index_limit(struct irdma_hmc_info *hmc_info, u32 type,
> +				      u32 idx, u32 cnt, u32 *sd_idx,
> +				      u32 *sd_limit)
> +{
> +	u64 fpm_addr, fpm_limit;
> +
> +	fpm_addr = hmc_info->hmc_obj[(type)].base +
> +		   hmc_info->hmc_obj[type].size * idx;
> +	fpm_limit = fpm_addr + hmc_info->hmc_obj[type].size * cnt;
> +	*sd_idx = (u32)(fpm_addr / IRDMA_HMC_DIRECT_BP_SIZE);
> +	*sd_limit = (u32)((fpm_limit - 1) / IRDMA_HMC_DIRECT_BP_SIZE);
> +	*sd_limit += 1;
> +}
> +
> +/**
> + * irdma_find_pd_index_limit - finds page descriptor index limit
> + * @hmc_info: pointer to the HMC configuration information struct
> + * @type: HMC resource type we're examining
> + * @idx: starting index for the object
> + * @cnt: number of objects we're trying to create
> + * @pd_idx: pointer to return page descriptor index
> + * @pd_limit: pointer to return page descriptor index limit
> + *
> + * Calculates the page descriptor index and index limit for the resource
> + * defined by irdma_hmc_rsrc_type.
> + */
> +
> +static void irdma_find_pd_index_limit(struct irdma_hmc_info *hmc_info, u32 type,
> +				      u32 idx, u32 cnt, u32 *pd_idx,
> +				      u32 *pd_limit)
> +{
> +	u64 fpm_adr, fpm_limit;
> +
> +	fpm_adr = hmc_info->hmc_obj[type].base +
> +		  hmc_info->hmc_obj[type].size * idx;
> +	fpm_limit = fpm_adr + (hmc_info)->hmc_obj[(type)].size * (cnt);
> +	*pd_idx = (u32)(fpm_adr / IRDMA_HMC_PAGED_BP_SIZE);
> +	*pd_limit = (u32)((fpm_limit - 1) / IRDMA_HMC_PAGED_BP_SIZE);
> +	*pd_limit += 1;
> +}
> +
> +/**
> + * irdma_set_sd_entry - setup entry for sd programming
> + * @pa: physical addr
> + * @idx: sd index
> + * @type: paged or direct sd
> + * @entry: sd entry ptr
> + */
> +static void irdma_set_sd_entry(u64 pa, u32 idx, enum irdma_sd_entry_type type,
> +			       struct irdma_update_sd_entry *entry)
> +{
> +	entry->data = pa | (IRDMA_HMC_MAX_BP_COUNT << IRDMA_PFHMC_SDDATALOW_PMSDBPCOUNT_S) |
> +		      (((type == IRDMA_SD_TYPE_PAGED) ? 0 : 1) << IRDMA_PFHMC_SDDATALOW_PMSDTYPE_S) |
> +		      (1 << IRDMA_PFHMC_SDDATALOW_PMSDVALID_S);
> +	entry->cmd = (idx | (1 << IRDMA_PFHMC_SDCMD_PMSDWR_S) | (1 << 15));
> +}
> +
> +/**
> + * irdma_clr_sd_entry - setup entry for sd clear
> + * @idx: sd index
> + * @type: paged or direct sd
> + * @entry: sd entry ptr
> + */
> +static void irdma_clr_sd_entry(u32 idx, enum irdma_sd_entry_type type,
> +			       struct irdma_update_sd_entry *entry)
> +{
> +	entry->data = (IRDMA_HMC_MAX_BP_COUNT << IRDMA_PFHMC_SDDATALOW_PMSDBPCOUNT_S) |
> +		      (((type == IRDMA_SD_TYPE_PAGED) ? 0 : 1) << IRDMA_PFHMC_SDDATALOW_PMSDTYPE_S);
> +	entry->cmd = (idx | (1 << IRDMA_PFHMC_SDCMD_PMSDWR_S) | (1 << 15));
> +}
> +
> +/**
> + * irdma_hmc_sd_one - setup 1 sd entry for cqp
> + * @dev: pointer to the device structure
> + * @hmc_fn_id: hmc's function id
> + * @pa: physical addr
> + * @sd_idx: sd index
> + * @type: paged or direct sd
> + * @setsd: flag to set or clear sd
> + */
> +enum irdma_status_code irdma_hmc_sd_one(struct irdma_sc_dev *dev, u8 hmc_fn_id,
> +					u64 pa, u32 sd_idx,
> +					enum irdma_sd_entry_type type,
> +					bool setsd)
> +{
> +	struct irdma_update_sds_info sdinfo;
> +
> +	sdinfo.cnt = 1;
> +	sdinfo.hmc_fn_id = hmc_fn_id;
> +	if (setsd)
> +		irdma_set_sd_entry(pa, sd_idx, type, sdinfo.entry);
> +	else
> +		irdma_clr_sd_entry(sd_idx, type, sdinfo.entry);
> +	return dev->cqp->process_cqp_sds(dev, &sdinfo);
> +}
> +
> +/**
> + * irdma_hmc_sd_grp - setup group of sd entries for cqp
> + * @dev: pointer to the device structure
> + * @hmc_info: pointer to the HMC configuration information struct
> + * @sd_index: sd index
> + * @sd_cnt: number of sd entries
> + * @setsd: flag to set or clear sd
> + */
> +static enum irdma_status_code irdma_hmc_sd_grp(struct irdma_sc_dev *dev,
> +					       struct irdma_hmc_info *hmc_info,
> +					       u32 sd_index, u32 sd_cnt,
> +					       bool setsd)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +	struct irdma_update_sds_info sdinfo = {};
> +	u64 pa;
> +	u32 i;
> +	enum irdma_status_code ret_code = 0;
> +
> +	sdinfo.hmc_fn_id = hmc_info->hmc_fn_id;
> +	for (i = sd_index; i < sd_index + sd_cnt; i++) {
> +		sd_entry = &hmc_info->sd_table.sd_entry[i];
> +		if (!sd_entry || (!sd_entry->valid && setsd) ||
> +		    (sd_entry->valid && !setsd))
> +			continue;
> +		if (setsd) {
> +			pa = (sd_entry->entry_type == IRDMA_SD_TYPE_PAGED) ?
> +				     sd_entry->u.pd_table.pd_page_addr.pa :
> +				     sd_entry->u.bp.addr.pa;
> +			irdma_set_sd_entry(pa, i, sd_entry->entry_type,
> +					   &sdinfo.entry[sdinfo.cnt]);
> +		} else {
> +			irdma_clr_sd_entry(i, sd_entry->entry_type,
> +					   &sdinfo.entry[sdinfo.cnt]);
> +		}
> +		sdinfo.cnt++;
> +		if (sdinfo.cnt == IRDMA_MAX_SD_ENTRIES) {
> +			ret_code = dev->cqp->process_cqp_sds(dev, &sdinfo);
> +			if (ret_code) {
> +				dev_dbg(rfdev_to_dev(dev),
> +					"HMC: sd_programming failed err=%d\n",
> +					ret_code);
> +				return ret_code;
> +			}
> +
> +			sdinfo.cnt = 0;
> +		}
> +	}
> +	if (sdinfo.cnt)
> +		ret_code = dev->cqp->process_cqp_sds(dev, &sdinfo);
> +
> +	return ret_code;
> +}
> +
> +/**
> + * irdma_hmc_finish_add_sd_reg - program sd entries for objects
> + * @dev: pointer to the device structure
> + * @info: create obj info
> + */
> +static enum irdma_status_code
> +irdma_hmc_finish_add_sd_reg(struct irdma_sc_dev *dev,
> +			    struct irdma_hmc_create_obj_info *info)
> +{
> +	if (info->start_idx >= info->hmc_info->hmc_obj[info->rsrc_type].cnt)
> +		return IRDMA_ERR_INVALID_HMC_OBJ_INDEX;
> +
> +	if ((info->start_idx + info->count) >
> +	    info->hmc_info->hmc_obj[info->rsrc_type].cnt)
> +		return IRDMA_ERR_INVALID_HMC_OBJ_COUNT;
> +
> +	if (!info->add_sd_cnt)
> +		return 0;
> +	return irdma_hmc_sd_grp(dev, info->hmc_info,
> +				info->hmc_info->sd_indexes[0], info->add_sd_cnt,
> +				true);
> +}
> +
> +/**
> + * irdma_sc_create_hmc_obj - allocate backing store for hmc objects
> + * @dev: pointer to the device structure
> + * @info: pointer to irdma_hmc_create_obj_info struct
> + *
> + * This will allocate memory for PDs and backing pages and populate
> + * the sd and pd entries.
> + */
> +enum irdma_status_code
> +irdma_sc_create_hmc_obj(struct irdma_sc_dev *dev,
> +			struct irdma_hmc_create_obj_info *info)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +	u32 sd_idx, sd_lmt;
> +	u32 pd_idx = 0, pd_lmt = 0;
> +	u32 pd_idx1 = 0, pd_lmt1 = 0;
> +	u32 i, j;
> +	bool pd_error = false;
> +	enum irdma_status_code ret_code = 0;
> +
> +	if (info->start_idx >= info->hmc_info->hmc_obj[info->rsrc_type].cnt)
> +		return IRDMA_ERR_INVALID_HMC_OBJ_INDEX;
> +
> +	if ((info->start_idx + info->count) >
> +	    info->hmc_info->hmc_obj[info->rsrc_type].cnt) {
> +		dev_dbg(rfdev_to_dev(dev),
> +			"HMC: error type %u, start = %u, req cnt %u, cnt = %u\n",
> +			info->rsrc_type, info->start_idx, info->count,
> +			info->hmc_info->hmc_obj[info->rsrc_type].cnt);
> +		return IRDMA_ERR_INVALID_HMC_OBJ_COUNT;
> +	}
> +
> +	irdma_find_sd_index_limit(info->hmc_info, info->rsrc_type,
> +				  info->start_idx, info->count, &sd_idx,
> +				  &sd_lmt);
> +	if (sd_idx >= info->hmc_info->sd_table.sd_cnt ||
> +	    sd_lmt > info->hmc_info->sd_table.sd_cnt) {
> +		return IRDMA_ERR_INVALID_SD_INDEX;
> +	}
> +
> +	irdma_find_pd_index_limit(info->hmc_info, info->rsrc_type,
> +				  info->start_idx, info->count, &pd_idx,
> +				  &pd_lmt);
> +
> +	for (j = sd_idx; j < sd_lmt; j++) {
> +		ret_code = irdma_add_sd_table_entry(dev->hw, info->hmc_info, j,
> +						    info->entry_type,
> +						    IRDMA_HMC_DIRECT_BP_SIZE);
> +		if (ret_code)
> +			goto exit_sd_error;
> +
> +		sd_entry = &info->hmc_info->sd_table.sd_entry[j];
> +		if (sd_entry->entry_type == IRDMA_SD_TYPE_PAGED &&
> +		    (dev->hmc_info == info->hmc_info &&
> +		     info->rsrc_type != IRDMA_HMC_IW_PBLE)) {
> +			pd_idx1 = max(pd_idx, (j * IRDMA_HMC_MAX_BP_COUNT));
> +			pd_lmt1 = min(pd_lmt, (j + 1) * IRDMA_HMC_MAX_BP_COUNT);
> +			for (i = pd_idx1; i < pd_lmt1; i++) {
> +				/* update the pd table entry */
> +				ret_code = irdma_add_pd_table_entry(dev,
> +								    info->hmc_info,
> +								    i, NULL);
> +				if (ret_code) {
> +					pd_error = true;
> +					break;
> +				}
> +			}
> +			if (pd_error) {
> +				while (i && (i > pd_idx1)) {
> +					irdma_remove_pd_bp(dev, info->hmc_info,
> +							   i - 1);
> +					i--;
> +				}
> +			}
> +		}
> +		if (sd_entry->valid)
> +			continue;
> +
> +		info->hmc_info->sd_indexes[info->add_sd_cnt] = (u16)j;
> +		info->add_sd_cnt++;
> +		sd_entry->valid = true;
> +	}
> +	return irdma_hmc_finish_add_sd_reg(dev, info);
> +
> +exit_sd_error:
> +	while (j && (j > sd_idx)) {
> +		sd_entry = &info->hmc_info->sd_table.sd_entry[j - 1];
> +		switch (sd_entry->entry_type) {
> +		case IRDMA_SD_TYPE_PAGED:
> +			pd_idx1 = max(pd_idx, (j - 1) * IRDMA_HMC_MAX_BP_COUNT);
> +			pd_lmt1 = min(pd_lmt, (j * IRDMA_HMC_MAX_BP_COUNT));
> +			for (i = pd_idx1; i < pd_lmt1; i++)
> +				irdma_prep_remove_pd_page(info->hmc_info, i);
> +			break;
> +		case IRDMA_SD_TYPE_DIRECT:
> +			irdma_prep_remove_pd_page(info->hmc_info, (j - 1));
> +			break;
> +		default:
> +			ret_code = IRDMA_ERR_INVALID_SD_TYPE;
> +			break;
> +		}
> +		j--;
> +	}
> +
> +	return ret_code;
> +}
> +
> +/**
> + * irdma_finish_del_sd_reg - delete sd entries for objects
> + * @dev: pointer to the device structure
> + * @info: dele obj info
> + * @reset: true if called before reset
> + */
> +static enum irdma_status_code
> +irdma_finish_del_sd_reg(struct irdma_sc_dev *dev,
> +			struct irdma_hmc_del_obj_info *info, bool reset)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +	enum irdma_status_code ret_code = 0;
> +	u32 i, sd_idx;
> +	struct irdma_dma_mem *mem;
> +
> +	if (dev->privileged && !reset)
> +		ret_code = irdma_hmc_sd_grp(dev, info->hmc_info,
> +					    info->hmc_info->sd_indexes[0],
> +					    info->del_sd_cnt, false);
> +
> +	if (ret_code)
> +		dev_dbg(rfdev_to_dev(dev), "HMC: error cqp sd sd_grp\n");
> +	for (i = 0; i < info->del_sd_cnt; i++) {
> +		sd_idx = info->hmc_info->sd_indexes[i];
> +		sd_entry = &info->hmc_info->sd_table.sd_entry[sd_idx];
> +		if (!sd_entry)
> +			continue;
> +		mem = (sd_entry->entry_type == IRDMA_SD_TYPE_PAGED) ?
> +			      &sd_entry->u.pd_table.pd_page_addr :
> +			      &sd_entry->u.bp.addr;
> +
> +		if (!mem || !mem->va) {
> +			dev_dbg(rfdev_to_dev(dev), "HMC: error cqp sd mem\n");
> +		} else {
> +			dma_free_coherent(hw_to_dev(dev->hw), mem->size,
> +					  mem->va, mem->pa);
> +			mem->va = NULL;
> +		}
> +	}
> +
> +	return ret_code;
> +}
> +
> +/**
> + * irdma_sc_del_hmc_obj - remove pe hmc objects
> + * @dev: pointer to the device structure
> + * @info: pointer to irdma_hmc_del_obj_info struct
> + * @reset: true if called before reset
> + *
> + * This will de-populate the SDs and PDs.  It frees
> + * the memory for PDS and backing storage.  After this function is returned,
> + * caller should deallocate memory allocated previously for
> + * book-keeping information about PDs and backing storage.
> + */
> +enum irdma_status_code irdma_sc_del_hmc_obj(struct irdma_sc_dev *dev,
> +					    struct irdma_hmc_del_obj_info *info,
> +					    bool reset)
> +{
> +	struct irdma_hmc_pd_table *pd_table;
> +	u32 sd_idx, sd_lmt;
> +	u32 pd_idx, pd_lmt, rel_pd_idx;
> +	u32 i, j;
> +	enum irdma_status_code ret_code = 0;
> +
> +	if (info->start_idx >= info->hmc_info->hmc_obj[info->rsrc_type].cnt) {
> +		dev_dbg(rfdev_to_dev(dev),
> +			"HMC: error start_idx[%04d]  >= [type %04d].cnt[%04d]\n",
> +			info->start_idx, info->rsrc_type,
> +			info->hmc_info->hmc_obj[info->rsrc_type].cnt);
> +		return IRDMA_ERR_INVALID_HMC_OBJ_INDEX;
> +	}
> +
> +	if ((info->start_idx + info->count) >
> +	    info->hmc_info->hmc_obj[info->rsrc_type].cnt) {
> +		dev_dbg(rfdev_to_dev(dev),
> +			"HMC: error start_idx[%04d] + count %04d  >= [type %04d].cnt[%04d]\n",
> +			info->start_idx, info->count, info->rsrc_type,
> +			info->hmc_info->hmc_obj[info->rsrc_type].cnt);
> +		return IRDMA_ERR_INVALID_HMC_OBJ_COUNT;
> +	}
> +
> +	irdma_find_pd_index_limit(info->hmc_info, info->rsrc_type,
> +				  info->start_idx, info->count, &pd_idx,
> +				  &pd_lmt);
> +
> +	for (j = pd_idx; j < pd_lmt; j++) {
> +		sd_idx = j / IRDMA_HMC_PD_CNT_IN_SD;
> +
> +		if (!info->hmc_info->sd_table.sd_entry[sd_idx].valid)
> +			continue;
> +
> +		if (info->hmc_info->sd_table.sd_entry[sd_idx].entry_type !=
> +		    IRDMA_SD_TYPE_PAGED)
> +			continue;
> +
> +		rel_pd_idx = j % IRDMA_HMC_PD_CNT_IN_SD;
> +		pd_table = &info->hmc_info->sd_table.sd_entry[sd_idx].u.pd_table;
> +		if (pd_table->pd_entry &&
> +		    pd_table->pd_entry[rel_pd_idx].valid) {
> +			ret_code = irdma_remove_pd_bp(dev, info->hmc_info, j);
> +			if (ret_code) {
> +				dev_dbg(rfdev_to_dev(dev),
> +					"HMC: remove_pd_bp error\n");
> +				return ret_code;
> +			}
> +		}
> +	}
> +
> +	irdma_find_sd_index_limit(info->hmc_info, info->rsrc_type,
> +				  info->start_idx, info->count, &sd_idx,
> +				  &sd_lmt);
> +	if (sd_idx >= info->hmc_info->sd_table.sd_cnt ||
> +	    sd_lmt > info->hmc_info->sd_table.sd_cnt) {
> +		dev_dbg(rfdev_to_dev(dev), "HMC: invalid sd_idx\n");
> +		return IRDMA_ERR_INVALID_SD_INDEX;
> +	}
> +
> +	for (i = sd_idx; i < sd_lmt; i++) {
> +		pd_table = &info->hmc_info->sd_table.sd_entry[i].u.pd_table;
> +		if (!info->hmc_info->sd_table.sd_entry[i].valid)
> +			continue;
> +		switch (info->hmc_info->sd_table.sd_entry[i].entry_type) {
> +		case IRDMA_SD_TYPE_DIRECT:
> +			ret_code = irdma_prep_remove_sd_bp(info->hmc_info, i);
> +			if (!ret_code) {
> +				info->hmc_info->sd_indexes[info->del_sd_cnt] =
> +					(u16)i;
> +				info->del_sd_cnt++;
> +			}
> +			break;
> +		case IRDMA_SD_TYPE_PAGED:
> +			ret_code = irdma_prep_remove_pd_page(info->hmc_info, i);
> +			if (ret_code)
> +				break;
> +			if (dev->hmc_info != info->hmc_info &&
> +			    info->rsrc_type == IRDMA_HMC_IW_PBLE &&
> +			    pd_table->pd_entry) {
> +				kfree(pd_table->pd_entry_virt_mem.va);
> +				pd_table->pd_entry = NULL;
> +			}
> +			info->hmc_info->sd_indexes[info->del_sd_cnt] = (u16)i;
> +			info->del_sd_cnt++;
> +			break;
> +		default:
> +			break;
> +		}
> +	}
> +	return irdma_finish_del_sd_reg(dev, info, reset);
> +}
> +
> +/**
> + * irdma_add_sd_table_entry - Adds a segment descriptor to the table
> + * @hw: pointer to our hw struct
> + * @hmc_info: pointer to the HMC configuration information struct
> + * @sd_index: segment descriptor index to manipulate
> + * @type: what type of segment descriptor we're manipulating
> + * @direct_mode_sz: size to alloc in direct mode
> + */
> +enum irdma_status_code irdma_add_sd_table_entry(struct irdma_hw *hw,
> +						struct irdma_hmc_info *hmc_info,
> +						u32 sd_index,
> +						enum irdma_sd_entry_type type,
> +						u64 direct_mode_sz)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +	struct irdma_dma_mem dma_mem;
> +	u64 alloc_len;
> +
> +	sd_entry = &hmc_info->sd_table.sd_entry[sd_index];
> +	if (!sd_entry->valid) {
> +		if (type == IRDMA_SD_TYPE_PAGED)
> +			alloc_len = IRDMA_HMC_PAGED_BP_SIZE;
> +		else
> +			alloc_len = direct_mode_sz;
> +
> +		/* allocate a 4K pd page or 2M backing page */
> +		dma_mem.size = ALIGN(alloc_len, IRDMA_HMC_PD_BP_BUF_ALIGNMENT);
> +		dma_mem.va = dma_alloc_coherent(hw_to_dev(hw),
> +						dma_mem.size, &dma_mem.pa,
> +						GFP_ATOMIC);
> +		if (!dma_mem.va)
> +			return IRDMA_ERR_NO_MEMORY;
> +
> +		if (type == IRDMA_SD_TYPE_PAGED) {
> +			struct irdma_virt_mem *vmem =
> +				&sd_entry->u.pd_table.pd_entry_virt_mem;
> +
> +			vmem->size = sizeof(struct irdma_hmc_pd_entry) * 512;
> +			vmem->va = kzalloc(vmem->size, GFP_ATOMIC);
> +			if (!vmem->va) {
> +				dma_free_coherent(hw_to_dev(hw), dma_mem.size,
> +						  dma_mem.va, dma_mem.pa);
> +				dma_mem.va = NULL;
> +				return IRDMA_ERR_NO_MEMORY;
> +			}
> +			sd_entry->u.pd_table.pd_entry = vmem->va;
> +
> +			memcpy(&sd_entry->u.pd_table.pd_page_addr, &dma_mem,
> +			       sizeof(sd_entry->u.pd_table.pd_page_addr));
> +		} else {
> +			memcpy(&sd_entry->u.bp.addr, &dma_mem,
> +			       sizeof(sd_entry->u.bp.addr));
> +
> +			sd_entry->u.bp.sd_pd_index = sd_index;
> +		}
> +
> +		hmc_info->sd_table.sd_entry[sd_index].entry_type = type;
> +		IRDMA_INC_SD_REFCNT(&hmc_info->sd_table);
> +	}
> +	if (sd_entry->entry_type == IRDMA_SD_TYPE_DIRECT)
> +		IRDMA_INC_BP_REFCNT(&sd_entry->u.bp);
> +
> +	return 0;
> +}
> +
> +/**
> + * irdma_add_pd_table_entry - Adds page descriptor to the specified table
> + * @dev: pointer to our device structure
> + * @hmc_info: pointer to the HMC configuration information structure
> + * @pd_index: which page descriptor index to manipulate
> + * @rsrc_pg: if not NULL, use preallocated page instead of allocating new one.
> + *
> + * This function:
> + *	1. Initializes the pd entry
> + *	2. Adds pd_entry in the pd_table
> + *	3. Mark the entry valid in irdma_hmc_pd_entry structure
> + *	4. Initializes the pd_entry's ref count to 1
> + * assumptions:
> + *	1. The memory for pd should be pinned down, physically contiguous and
> + *	   aligned on 4K boundary and zeroed memory.
> + *	2. It should be 4K in size.
> + */
> +enum irdma_status_code irdma_add_pd_table_entry(struct irdma_sc_dev *dev,
> +						struct irdma_hmc_info *hmc_info,
> +						u32 pd_index,
> +						struct irdma_dma_mem *rsrc_pg)
> +{
> +	struct irdma_hmc_pd_table *pd_table;
> +	struct irdma_hmc_pd_entry *pd_entry;
> +	struct irdma_dma_mem mem;
> +	struct irdma_dma_mem *page = &mem;
> +	u32 sd_idx, rel_pd_idx;
> +	u64 *pd_addr;
> +	u64 page_desc;
> +
> +	if (pd_index / IRDMA_HMC_PD_CNT_IN_SD >= hmc_info->sd_table.sd_cnt)
> +		return IRDMA_ERR_INVALID_PAGE_DESC_INDEX;
> +
> +	sd_idx = (pd_index / IRDMA_HMC_PD_CNT_IN_SD);
> +	if (hmc_info->sd_table.sd_entry[sd_idx].entry_type !=
> +	    IRDMA_SD_TYPE_PAGED)
> +		return 0;
> +
> +	rel_pd_idx = (pd_index % IRDMA_HMC_PD_CNT_IN_SD);
> +	pd_table = &hmc_info->sd_table.sd_entry[sd_idx].u.pd_table;
> +	pd_entry = &pd_table->pd_entry[rel_pd_idx];
> +	if (!pd_entry->valid) {
> +		if (rsrc_pg) {
> +			pd_entry->rsrc_pg = true;
> +			page = rsrc_pg;
> +		} else {
> +			page->size = ALIGN(IRDMA_HMC_PAGED_BP_SIZE,
> +					   IRDMA_HMC_PD_BP_BUF_ALIGNMENT);
> +			page->va = dma_alloc_coherent(hw_to_dev(dev->hw),
> +						      page->size, &page->pa,
> +						      GFP_KERNEL);
> +			if (!page->va)
> +				return IRDMA_ERR_NO_MEMORY;
> +
> +			pd_entry->rsrc_pg = false;
> +		}
> +
> +		memcpy(&pd_entry->bp.addr, page, sizeof(pd_entry->bp.addr));
> +		pd_entry->bp.sd_pd_index = pd_index;
> +		pd_entry->bp.entry_type = IRDMA_SD_TYPE_PAGED;
> +		page_desc = page->pa | 0x1;
> +		pd_addr = pd_table->pd_page_addr.va;
> +		pd_addr += rel_pd_idx;
> +		memcpy(pd_addr, &page_desc, sizeof(*pd_addr));
> +		pd_entry->sd_index = sd_idx;
> +		pd_entry->valid = true;
> +		IRDMA_INC_PD_REFCNT(pd_table);
> +		if (hmc_info->hmc_fn_id < dev->hw_attrs.first_hw_vf_fpm_id)
> +			IRDMA_INVALIDATE_PF_HMC_PD(dev, sd_idx, rel_pd_idx);
> +		else if (dev->hw->hmc.hmc_fn_id != hmc_info->hmc_fn_id)
> +			IRDMA_INVALIDATE_VF_HMC_PD(dev, sd_idx, rel_pd_idx,
> +						   hmc_info->hmc_fn_id);
> +	}
> +	IRDMA_INC_BP_REFCNT(&pd_entry->bp);
> +
> +	return 0;
> +}
> +
> +/**
> + * irdma_remove_pd_bp - remove a backing page from a page descriptor
> + * @dev: pointer to our HW structure
> + * @hmc_info: pointer to the HMC configuration information structure
> + * @idx: the page index
> + *
> + * This function:
> + *	1. Marks the entry in pd table (for paged address mode) or in sd table
> + *	   (for direct address mode) invalid.
> + *	2. Write to register PMPDINV to invalidate the backing page in FV cache
> + *	3. Decrement the ref count for the pd _entry
> + * assumptions:
> + *	1. Caller can deallocate the memory used by backing storage after this
> + *	   function returns.
> + */
> +enum irdma_status_code irdma_remove_pd_bp(struct irdma_sc_dev *dev,
> +					  struct irdma_hmc_info *hmc_info,
> +					  u32 idx)
> +{
> +	struct irdma_hmc_pd_entry *pd_entry;
> +	struct irdma_hmc_pd_table *pd_table;
> +	struct irdma_hmc_sd_entry *sd_entry;
> +	u32 sd_idx, rel_pd_idx;
> +	struct irdma_dma_mem *mem;
> +	u64 *pd_addr;
> +
> +	sd_idx = idx / IRDMA_HMC_PD_CNT_IN_SD;
> +	rel_pd_idx = idx % IRDMA_HMC_PD_CNT_IN_SD;
> +	if (sd_idx >= hmc_info->sd_table.sd_cnt)
> +		return IRDMA_ERR_INVALID_PAGE_DESC_INDEX;
> +
> +	sd_entry = &hmc_info->sd_table.sd_entry[sd_idx];
> +	if (sd_entry->entry_type != IRDMA_SD_TYPE_PAGED)
> +		return IRDMA_ERR_INVALID_SD_TYPE;
> +
> +	pd_table = &hmc_info->sd_table.sd_entry[sd_idx].u.pd_table;
> +	pd_entry = &pd_table->pd_entry[rel_pd_idx];
> +	IRDMA_DEC_BP_REFCNT(&pd_entry->bp);
> +	if (pd_entry->bp.ref_cnt)
> +		return 0;
> +
> +	pd_entry->valid = false;
> +	IRDMA_DEC_PD_REFCNT(pd_table);
> +	pd_addr = pd_table->pd_page_addr.va;
> +	pd_addr += rel_pd_idx;
> +	memset(pd_addr, 0, sizeof(u64));
> +	if (dev->privileged) {
> +		if (dev->hmc_fn_id == hmc_info->hmc_fn_id)
> +			IRDMA_INVALIDATE_PF_HMC_PD(dev, sd_idx, idx);
> +		else
> +			IRDMA_INVALIDATE_VF_HMC_PD(dev, sd_idx, idx,
> +						   hmc_info->hmc_fn_id);
> +	}
> +
> +	if (!pd_entry->rsrc_pg) {
> +		mem = &pd_entry->bp.addr;
> +		if (!mem || !mem->va)
> +			return IRDMA_ERR_PARAM;
> +
> +		dma_free_coherent(hw_to_dev(dev->hw), mem->size, mem->va,
> +				  mem->pa);
> +		mem->va = NULL;
> +	}
> +	if (!pd_table->ref_cnt)
> +		kfree(pd_table->pd_entry_virt_mem.va);
> +
> +	return 0;
> +}
> +
> +/**
> + * irdma_prep_remove_sd_bp - Prepares to remove a backing page from a sd entry
> + * @hmc_info: pointer to the HMC configuration information structure
> + * @idx: the page index
> + */
> +enum irdma_status_code irdma_prep_remove_sd_bp(struct irdma_hmc_info *hmc_info,
> +					       u32 idx)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +
> +	sd_entry = &hmc_info->sd_table.sd_entry[idx];
> +	IRDMA_DEC_BP_REFCNT(&sd_entry->u.bp);
> +	if (sd_entry->u.bp.ref_cnt)
> +		return IRDMA_ERR_NOT_READY;
> +
> +	IRDMA_DEC_SD_REFCNT(&hmc_info->sd_table);
> +	sd_entry->valid = false;
> +
> +	return 0;
> +}
> +
> +/**
> + * irdma_prep_remove_pd_page - Prepares to remove a PD page from sd entry.
> + * @hmc_info: pointer to the HMC configuration information structure
> + * @idx: segment descriptor index to find the relevant page descriptor
> + */
> +enum irdma_status_code
> +irdma_prep_remove_pd_page(struct irdma_hmc_info *hmc_info, u32 idx)
> +{
> +	struct irdma_hmc_sd_entry *sd_entry;
> +
> +	sd_entry = &hmc_info->sd_table.sd_entry[idx];
> +
> +	if (sd_entry->u.pd_table.ref_cnt)
> +		return IRDMA_ERR_NOT_READY;
> +
> +	sd_entry->valid = false;
> +	IRDMA_DEC_SD_REFCNT(&hmc_info->sd_table);
> +
> +	return 0;
> +}
> diff --git a/drivers/infiniband/hw/irdma/hmc.h b/drivers/infiniband/hw/irdma/hmc.h
> new file mode 100644
> index 000000000000..6f3fbf61f048
> --- /dev/null
> +++ b/drivers/infiniband/hw/irdma/hmc.h
> @@ -0,0 +1,217 @@
> +/* SPDX-License-Identifier: GPL-2.0 or Linux-OpenIB */
> +/* Copyright (c) 2015 - 2019 Intel Corporation */
> +#ifndef IRDMA_HMC_H
> +#define IRDMA_HMC_H
> +
> +#include "defs.h"
> +
> +#define IRDMA_HMC_MAX_BP_COUNT			512
> +#define IRDMA_MAX_SD_ENTRIES			11
> +#define IRDMA_HW_DBG_HMC_INVALID_BP_MARK	0xca
> +#define IRDMA_HMC_INFO_SIGNATURE		0x484d5347
> +#define IRDMA_HMC_PD_CNT_IN_SD			512
> +#define IRDMA_HMC_DIRECT_BP_SIZE		0x200000
> +#define IRDMA_HMC_MAX_SD_COUNT			8192
> +#define IRDMA_HMC_PAGED_BP_SIZE			4096
> +#define IRDMA_HMC_PD_BP_BUF_ALIGNMENT		4096
> +#define IRDMA_FIRST_VF_FPM_ID			8
> +#define FPM_MULTIPLIER				1024
> +
> +#define IRDMA_INC_SD_REFCNT(sd_table)	((sd_table)->ref_cnt++)
> +#define IRDMA_INC_PD_REFCNT(pd_table)	((pd_table)->ref_cnt++)
> +#define IRDMA_INC_BP_REFCNT(bp)		((bp)->ref_cnt++)
> +
> +#define IRDMA_DEC_SD_REFCNT(sd_table)	((sd_table)->ref_cnt--)
> +#define IRDMA_DEC_PD_REFCNT(pd_table)	((pd_table)->ref_cnt--)
> +#define IRDMA_DEC_BP_REFCNT(bp)		((bp)->ref_cnt--)

It is bad for two reasons, first you obfuscated simple ++/-- and second
you called it refcnt, while we have special type for that.

Thanks

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ