// SPDX-License-Identifier: GPL-2.0 OR MIT
/*
 * Copyright 2014-2022 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
/*
 * get_mqd_type_from_queue_type - map a KFD queue type to the MQD type
 * that manages it.
 *
 * SDMA and XGMI-SDMA queues share the SDMA MQD format; every other
 * queue type is managed through a CP MQD.
 */
static inline enum KFD_MQD_TYPE get_mqd_type_from_queue_type(enum kfd_queue_type type)
{
	if (type == KFD_QUEUE_TYPE_SDMA || type == KFD_QUEUE_TYPE_SDMA_XGMI)
		return KFD_MQD_TYPE_SDMA;
	return KFD_MQD_TYPE_CP;
}
staticbool is_pipe_enabled(struct device_queue_manager *dqm, int mec, int pipe)
{ int i; int pipe_offset = (mec * dqm->dev->kfd->shared_resources.num_pipe_per_mec
+ pipe) * dqm->dev->kfd->shared_resources.num_queue_per_pipe;
/* queue is available for KFD usage if bit is 1 */ for (i = 0; i < dqm->dev->kfd->shared_resources.num_queue_per_pipe; ++i) if (test_bit(pipe_offset + i,
dqm->dev->kfd->shared_resources.cp_queue_bitmap)) returntrue; returnfalse;
}
amdgpu_mes_lock(&adev->mes);
r = adev->mes.funcs->add_hw_queue(&adev->mes, &queue_input);
amdgpu_mes_unlock(&adev->mes);
up_read(&adev->reset_domain->sem); if (r) {
dev_err(adev->dev, "failed to add hardware queue to MES, doorbell=0x%x\n",
q->properties.doorbell_off);
dev_err(adev->dev, "MES might be in unrecoverable state, issue a GPU reset\n");
kfd_hws_hang(dqm);
}
amdgpu_mes_lock(&adev->mes);
r = adev->mes.funcs->remove_hw_queue(&adev->mes, &queue_input);
amdgpu_mes_unlock(&adev->mes);
up_read(&adev->reset_domain->sem);
if (r) {
dev_err(adev->dev, "failed to remove hardware queue from MES, doorbell=0x%x\n",
q->properties.doorbell_off);
dev_err(adev->dev, "MES might be in unrecoverable state, issue a GPU reset\n");
kfd_hws_hang(dqm);
}
list_for_each_entry(cur, &dqm->queues, list) {
qpd = cur->qpd;
list_for_each_entry(q, &qpd->queues_list, list) { if (!q->properties.is_active) continue;
retval = add_queue_mes(dqm, q, qpd); if (retval) {
dev_err(dev, "%s: Failed to add queue %d for dev %d",
__func__,
q->properties.queue_id,
dqm->dev->id); return retval;
}
}
}
return retval;
}
/*
 * suspend_all_queues_mes - ask the MES firmware to suspend all gangs.
 *
 * Holds the reset-domain read lock across the MES call so a concurrent
 * GPU reset cannot race with it; returns -EIO if a reset is already in
 * progress (trylock fails). If MES reports failure, the hardware
 * scheduler is assumed to be in an unrecoverable state and
 * kfd_hws_hang() is called to trigger a GPU reset.
 *
 * Return: 0 on success, -EIO if a reset holds the lock, or the error
 * from amdgpu_mes_suspend().
 */
static int suspend_all_queues_mes(struct device_queue_manager *dqm)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)dqm->dev->adev;
	int r = 0;

	if (!down_read_trylock(&adev->reset_domain->sem))
		return -EIO;

	r = amdgpu_mes_suspend(adev);
	up_read(&adev->reset_domain->sem);

	if (r) {
		dev_err(adev->dev, "failed to suspend gangs from MES\n");
		dev_err(adev->dev, "MES might be in unrecoverable state, issue a GPU reset\n");
		kfd_hws_hang(dqm);
	}

	return r;
}
/*
 * resume_all_queues_mes - ask the MES firmware to resume all gangs.
 *
 * Mirror of suspend_all_queues_mes(): holds the reset-domain read lock
 * across the MES call and returns -EIO when a reset is in progress. On
 * MES failure the HWS is assumed hung and kfd_hws_hang() schedules a
 * GPU reset.
 *
 * Note: the original extracted text was truncated after the error
 * branch; the trailing "return r;" is restored here to match the
 * suspend counterpart (a non-void function must not fall off the end).
 *
 * Return: 0 on success, -EIO if a reset holds the lock, or the error
 * from amdgpu_mes_resume().
 */
static int resume_all_queues_mes(struct device_queue_manager *dqm)
{
	struct amdgpu_device *adev = (struct amdgpu_device *)dqm->dev->adev;
	int r = 0;

	if (!down_read_trylock(&adev->reset_domain->sem))
		return -EIO;

	r = amdgpu_mes_resume(adev);
	up_read(&adev->reset_domain->sem);

	if (r) {
		dev_err(adev->dev, "failed to resume gangs from MES\n");
		dev_err(adev->dev, "MES might be in unrecoverable state, issue a GPU reset\n");
		kfd_hws_hang(dqm);
	}

	return r;
}
if (q->properties.is_gws) {
dqm->gws_queue_count--;
qpd->mapped_gws_queue = false;
}
}
/* * Allocate a doorbell ID to this queue. * If doorbell_id is passed in, make sure requested ID is valid then allocate it.
*/ staticint allocate_doorbell(struct qcm_process_device *qpd, struct queue *q,
uint32_t const *restore_id)
{ struct kfd_node *dev = qpd->dqm->dev;
if (!KFD_IS_SOC15(dev)) { /* On pre-SOC15 chips we need to use the queue ID to * preserve the user mode ABI.
*/
if (restore_id && *restore_id != q->properties.queue_id) return -EINVAL;
q->doorbell_id = q->properties.queue_id;
} elseif (q->properties.type == KFD_QUEUE_TYPE_SDMA ||
q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI) { /* For SDMA queues on SOC15 with 8-byte doorbell, use static * doorbell assignments based on the engine and queue id. * The doobell index distance between RLC (2*i) and (2*i+1) * for a SDMA engine is 512.
*/
/* * q->properties.sdma_engine_id corresponds to the virtual * sdma engine number. However, for doorbell allocation, * we need the physical sdma engine id in order to get the * correct doorbell offset.
*/
uint32_t valid_id = idx_offset[qpd->dqm->dev->node_id *
get_num_all_sdma_engines(qpd->dqm) +
q->properties.sdma_engine_id]
+ (q->properties.sdma_queue_id & 1)
* KFD_QUEUE_DOORBELL_MIRROR_OFFSET
+ (q->properties.sdma_queue_id >> 1);
if (restore_id && *restore_id != valid_id) return -EINVAL;
q->doorbell_id = valid_id;
} else { /* For CP queues on SOC15 */ if (restore_id) { /* make sure that ID is free */ if (__test_and_set_bit(*restore_id, qpd->doorbell_bitmap)) return -EINVAL;
q->doorbell_id = *restore_id;
} else { /* or reserve a free doorbell ID */ unsignedint found;
if (KFD_IS_SOC15(dqm->dev) && dqm->dev->kfd->cwsr_enabled)
program_trap_handler_settings(dqm, qpd);
/* qpd->page_table_base is set earlier when register_process() * is called, i.e. when the first queue is created.
*/
dqm->dev->kfd2kgd->set_vm_context_page_table_base(dqm->dev->adev,
qpd->vmid,
qpd->page_table_base); /* invalidate the VM context after pasid and vmid mapping is set up */
kfd_flush_tlb(qpd_to_pdd(qpd), TLB_FLUSH_LEGACY);
if (dqm->dev->kfd2kgd->set_scratch_backing_va)
dqm->dev->kfd2kgd->set_scratch_backing_va(dqm->dev->adev,
qpd->sh_hidden_private_base, qpd->vmid);
/* On GFX v7, CP doesn't flush TC at dequeue */ if (q->device->adev->asic_type == CHIP_HAWAII) if (flush_texture_cache_nocpsch(q->device, qpd))
dev_err(dev, "Failed to flush TC\n");
if (dqm->total_queue_count >= max_num_of_queues_per_device) {
pr_warn("Can't create new usermode queue because %d queues were already created\n",
dqm->total_queue_count);
retval = -EPERM; goto out_unlock;
}
if (list_empty(&qpd->queues_list)) {
retval = allocate_vmid(dqm, qpd, q); if (retval) goto out_unlock;
}
q->properties.vmid = qpd->vmid; /* * Eviction state logic: mark all queues as evicted, even ones * not currently active. Restoring inactive queues later only * updates the is_evicted flag but is a no-op otherwise.
*/
q->properties.is_evicted = !!qpd->evicted;
if (q->properties.is_active) { if (!dqm->sched_running) {
WARN_ONCE(1, "Load non-HWS mqd while stopped\n"); goto add_queue_to_list;
}
if (WARN(q->process->mm != current->mm, "should only run in user thread"))
retval = -EFAULT; else
retval = mqd_mgr->load_mqd(mqd_mgr, q->mqd, q->pipe,
q->queue, &q->properties, current->mm); if (retval) goto out_free_mqd;
}
add_queue_to_list:
list_add(&q->list, &qpd->queues_list);
qpd->queue_count++; if (q->properties.is_active)
increment_queue_count(dqm, qpd, q);
/* * Unconditionally increment this counter, regardless of the queue's * type or whether the queue is active.
*/
dqm->total_queue_count++;
pr_debug("Total of %d queues are accountable so far\n",
dqm->total_queue_count); goto out_unlock;
/* Access to DQM has to be locked before calling destroy_queue_nocpsch_locked * to avoid asynchronized access
*/ staticint destroy_queue_nocpsch_locked(struct device_queue_manager *dqm, struct qcm_process_device *qpd, struct queue *q)
{ int retval; struct mqd_manager *mqd_mgr;
list_del(&q->list); if (list_empty(&qpd->queues_list)) { if (qpd->reset_wavefronts) {
pr_warn("Resetting wave fronts (nocpsch) on dev %p\n",
dqm->dev); /* dbgdev_wave_reset_wavefronts has to be called before * deallocate_vmid(), i.e. when vmid is still in use.
*/
dbgdev_wave_reset_wavefronts(dqm->dev,
qpd->pqm->process);
qpd->reset_wavefronts = false;
}
deallocate_vmid(dqm, qpd, q);
}
qpd->queue_count--; if (q->properties.is_active)
decrement_queue_count(dqm, qpd, q);
/* Save previous activity state for counters */
prev_active = q->properties.is_active;
/* Make sure the queue is unmapped before updating the MQD */ if (dqm->sched_policy != KFD_SCHED_POLICY_NO_HWS) { if (!dqm->dev->kfd->shared_resources.enable_mes)
retval = unmap_queues_cpsch(dqm,
KFD_UNMAP_QUEUES_FILTER_DYNAMIC_QUEUES, 0, USE_DEFAULT_GRACE_PERIOD, false); elseif (prev_active)
retval = remove_queue_mes(dqm, q, &pdd->qpd);
/* queue is reset so inaccessable */ if (pdd->has_reset_queue) {
retval = -EACCES; goto out_unlock;
}
/* * check active state vs. the previous state and modify * counter accordingly. map_queues_cpsch uses the * dqm->active_queue_count to determine whether a new runlist must be * uploaded.
*/ if (q->properties.is_active && !prev_active) {
increment_queue_count(dqm, &pdd->qpd, q);
} elseif (!q->properties.is_active && prev_active) {
decrement_queue_count(dqm, &pdd->qpd, q);
} elseif (q->gws && !q->properties.is_gws) { if (q->properties.is_active) {
dqm->gws_queue_count++;
pdd->qpd.mapped_gws_queue = true;
}
q->properties.is_gws = true;
} elseif (!q->gws && q->properties.is_gws) { if (q->properties.is_active) {
dqm->gws_queue_count--;
pdd->qpd.mapped_gws_queue = false;
}
q->properties.is_gws = false;
}
if (dqm->sched_policy != KFD_SCHED_POLICY_NO_HWS) { if (!dqm->dev->kfd->shared_resources.enable_mes)
retval = map_queues_cpsch(dqm); elseif (q->properties.is_active)
retval = add_queue_mes(dqm, q, &pdd->qpd);
} elseif (q->properties.is_active &&
(q->properties.type == KFD_QUEUE_TYPE_COMPUTE ||
q->properties.type == KFD_QUEUE_TYPE_SDMA ||
q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI)) { if (WARN(q->process->mm != current->mm, "should only run in user thread"))
retval = -EFAULT; else
retval = mqd_mgr->load_mqd(mqd_mgr, q->mqd,
q->pipe, q->queue,
&q->properties, current->mm);
}
out_unlock:
dqm_unlock(dqm); return retval;
}
/* suspend_single_queue does not lock the dqm like the * evict_process_queues_cpsch or evict_process_queues_nocpsch. You should * lock the dqm before calling, and unlock after calling. * * The reason we don't lock the dqm is because this function may be * called on multiple queues in a loop, so rather than locking/unlocking * multiple times, we will just keep the dqm locked for all of the calls.
*/ staticint suspend_single_queue(struct device_queue_manager *dqm, struct kfd_process_device *pdd, struct queue *q)
{ bool is_new;
if (q->properties.is_suspended) return 0;
pr_debug("Suspending process pid %d queue [%i]\n",
pdd->process->lead_thread->pid,
q->properties.queue_id);
if (is_new || q->properties.is_being_destroyed) {
pr_debug("Suspend: skip %s queue id %i\n",
is_new ? "new" : "destroyed",
q->properties.queue_id); return -EBUSY;
}
q->properties.is_suspended = true; if (q->properties.is_active) { if (dqm->dev->kfd->shared_resources.enable_mes) { int r = remove_queue_mes(dqm, q, &pdd->qpd);
/* resume_single_queue does not lock the dqm like the functions * restore_process_queues_cpsch or restore_process_queues_nocpsch. You should * lock the dqm before calling, and unlock after calling. * * The reason we don't lock the dqm is because this function may be * called on multiple queues in a loop, so rather than locking/unlocking * multiple times, we will just keep the dqm locked for all of the calls.
*/ staticint resume_single_queue(struct device_queue_manager *dqm, struct qcm_process_device *qpd, struct queue *q)
{ struct kfd_process_device *pdd;
if (!q->properties.is_suspended) return 0;
pdd = qpd_to_pdd(qpd);
pr_debug("Restoring from suspend process pid %d queue [%i]\n",
pdd->process->lead_thread->pid,
q->properties.queue_id);
q->properties.is_suspended = false;
if (QUEUE_IS_ACTIVE(q->properties)) { if (dqm->dev->kfd->shared_resources.enable_mes) { int r = add_queue_mes(dqm, q, &pdd->qpd);
dqm_lock(dqm); if (qpd->evicted++ > 0) /* already evicted, do nothing */ goto out;
pdd = qpd_to_pdd(qpd);
pr_debug_ratelimited("Evicting process pid %d queues\n",
pdd->process->lead_thread->pid);
pdd->last_evict_timestamp = get_jiffies_64(); /* Mark all queues as evicted. Deactivate all active queues on * the qpd.
*/
list_for_each_entry(q, &qpd->queues_list, list) {
q->properties.is_evicted = true; if (!q->properties.is_active) continue;
if (WARN_ONCE(!dqm->sched_running, "Evict when stopped\n")) continue;
retval = mqd_mgr->destroy_mqd(mqd_mgr, q->mqd,
(dqm->dev->kfd->cwsr_enabled ?
KFD_PREEMPT_TYPE_WAVEFRONT_SAVE :
KFD_PREEMPT_TYPE_WAVEFRONT_DRAIN),
KFD_UNMAP_LATENCY_MS, q->pipe, q->queue); if (retval && !ret) /* Return the first error, but keep going to * maintain a consistent eviction state
*/
ret = retval;
}
dqm_lock(dqm); if (qpd->evicted++ > 0) /* already evicted, do nothing */ goto out;
pdd = qpd_to_pdd(qpd);
/* The debugger creates processes that temporarily have not acquired * all VMs for all devices and has no VMs itself. * Skip queue eviction on process eviction.
*/ if (!pdd->drm_priv) goto out;
pr_debug_ratelimited("Evicting process pid %d queues\n",
pdd->process->lead_thread->pid);
if (dqm->dev->kfd->shared_resources.enable_mes) {
pdd->last_evict_timestamp = get_jiffies_64();
retval = suspend_all_queues_mes(dqm); if (retval) {
dev_err(dev, "Suspending all queues failed"); goto out;
}
}
/* Mark all queues as evicted. Deactivate all active queues on * the qpd.
*/
list_for_each_entry(q, &qpd->queues_list, list) {
q->properties.is_evicted = true; if (!q->properties.is_active) continue;
dqm_lock(dqm); if (WARN_ON_ONCE(!qpd->evicted)) /* already restored, do nothing */ goto out; if (qpd->evicted > 1) { /* ref count still > 0, decrement & quit */
qpd->evicted--; goto out;
}
pr_debug_ratelimited("Restoring process pid %d queues\n",
pdd->process->lead_thread->pid);
/* Update PD Base in QPD */
qpd->page_table_base = pd_base;
pr_debug("Updated PD address to 0x%llx\n", pd_base);
if (!list_empty(&qpd->queues_list)) {
dqm->dev->kfd2kgd->set_vm_context_page_table_base(
dqm->dev->adev,
qpd->vmid,
qpd->page_table_base);
kfd_flush_tlb(pdd, TLB_FLUSH_LEGACY);
}
/* Take a safe reference to the mm_struct, which may otherwise * disappear even while the kfd_process is still referenced.
*/
mm = get_task_mm(pdd->process->lead_thread); if (!mm) {
ret = -EFAULT; goto out;
}
/* Remove the eviction flags. Activate queues that are not * inactive for other reasons.
*/
list_for_each_entry(q, &qpd->queues_list, list) {
q->properties.is_evicted = false; if (!QUEUE_IS_ACTIVE(q->properties)) continue;
dqm_lock(dqm); if (WARN_ON_ONCE(!qpd->evicted)) /* already restored, do nothing */ goto out; if (qpd->evicted > 1) { /* ref count still > 0, decrement & quit */
qpd->evicted--; goto out;
}
/* The debugger creates processes that temporarily have not acquired * all VMs for all devices and has no VMs itself. * Skip queue restore on process restore.
*/ if (!pdd->drm_priv) goto vm_not_acquired;
pr_debug_ratelimited("Restoring process pid %d queues\n",
pdd->process->lead_thread->pid);
/* Update PD Base in QPD */
qpd->page_table_base = amdgpu_amdkfd_gpuvm_get_process_page_dir(pdd->drm_priv);
pr_debug("Updated PD address to 0x%llx\n", qpd->page_table_base);
/* activate all active queues on the qpd */
list_for_each_entry(q, &qpd->queues_list, list) {
q->properties.is_evicted = false; if (!QUEUE_IS_ACTIVE(q->properties)) continue;
/* Update PD Base in QPD */
qpd->page_table_base = pd_base;
pr_debug("Updated PD address to 0x%llx\n", pd_base);
retval = dqm->asic_ops.update_qpd(dqm, qpd);
dqm->processes_count++;
dqm_unlock(dqm);
/* Outside the DQM lock because under the DQM lock we can't do * reclaim or take other locks that others hold while reclaiming.
*/
kfd_inc_compute_active(dqm->dev);
pr_debug("qpd->queues_list is %s\n",
list_empty(&qpd->queues_list) ? "empty" : "not empty");
retval = 0;
dqm_lock(dqm);
list_for_each_entry_safe(cur, next, &dqm->queues, list) { if (qpd == cur->qpd) {
list_del(&cur->list);
kfree(cur);
dqm->processes_count--; goto out;
}
} /* qpd not found in dqm list */
retval = 1;
out:
dqm_unlock(dqm);
/* Outside the DQM lock because under the DQM lock we can't do * reclaim or take other locks that others hold while reclaiming.
*/ if (!retval)
kfd_dec_compute_active(dqm->dev);
if (q->properties.type == KFD_QUEUE_TYPE_SDMA) { if (bitmap_empty(dqm->sdma_bitmap, get_num_sdma_queues(dqm))) {
dev_warn(dev, "No more SDMA queue to allocate (%d total queues)\n",
get_num_sdma_queues(dqm)); return -ENOMEM;
}
if (restore_sdma_id) { /* Re-use existing sdma_id */ if (!test_bit(*restore_sdma_id, dqm->sdma_bitmap)) {
dev_err(dev, "SDMA queue already in use\n"); return -EBUSY;
}
clear_bit(*restore_sdma_id, dqm->sdma_bitmap);
q->sdma_id = *restore_sdma_id;
} else { /* Find first available sdma_id */
bit = find_first_bit(dqm->sdma_bitmap,
get_num_sdma_queues(dqm));
clear_bit(bit, dqm->sdma_bitmap);
q->sdma_id = bit;
}
q->properties.sdma_engine_id =
q->sdma_id % kfd_get_num_sdma_engines(dqm->dev);
q->properties.sdma_queue_id = q->sdma_id /
kfd_get_num_sdma_engines(dqm->dev);
} elseif (q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI) { if (bitmap_empty(dqm->xgmi_sdma_bitmap, get_num_xgmi_sdma_queues(dqm))) {
dev_warn(dev, "No more XGMI SDMA queue to allocate (%d total queues)\n",
get_num_xgmi_sdma_queues(dqm)); return -ENOMEM;
} if (restore_sdma_id) { /* Re-use existing sdma_id */ if (!test_bit(*restore_sdma_id, dqm->xgmi_sdma_bitmap)) {
dev_err(dev, "SDMA queue already in use\n"); return -EBUSY;
}
clear_bit(*restore_sdma_id, dqm->xgmi_sdma_bitmap);
q->sdma_id = *restore_sdma_id;
} else {
bit = find_first_bit(dqm->xgmi_sdma_bitmap,
get_num_xgmi_sdma_queues(dqm));
clear_bit(bit, dqm->xgmi_sdma_bitmap);
q->sdma_id = bit;
} /* sdma_engine_id is sdma id including * both PCIe-optimized SDMAs and XGMI- * optimized SDMAs. The calculation below * assumes the first N engines are always * PCIe-optimized ones
*/
q->properties.sdma_engine_id =
kfd_get_num_sdma_engines(dqm->dev) +
q->sdma_id % kfd_get_num_xgmi_sdma_engines(dqm->dev);
q->properties.sdma_queue_id = q->sdma_id /
kfd_get_num_xgmi_sdma_engines(dqm->dev);
} elseif (q->properties.type == KFD_QUEUE_TYPE_SDMA_BY_ENG_ID) { int i, num_queues, num_engines, eng_offset = 0, start_engine; bool free_bit_found = false, is_xgmi = false;
/* Scan available bit based on target engine ID. */
start_engine = q->properties.sdma_engine_id - eng_offset; for (i = start_engine; i < num_queues; i += num_engines) {
if (!test_bit(i, is_xgmi ? dqm->xgmi_sdma_bitmap : dqm->sdma_bitmap)) continue;
if (!free_bit_found) {
dev_warn(dev, "No more SDMA queue to allocate for target ID %i (%d total queues)\n",
q->properties.sdma_engine_id, num_queues); return -ENOMEM;
}
}
/* * Device Queue Manager implementation for cp scheduler
*/
staticint set_sched_resources(struct device_queue_manager *dqm)
{ int i, mec; struct scheduling_resources res; struct device *dev = dqm->dev->adev->dev;
res.vmid_mask = dqm->dev->compute_vmid_bitmap;
res.queue_mask = 0; for (i = 0; i < AMDGPU_MAX_QUEUES; ++i) {
mec = (i / dqm->dev->kfd->shared_resources.num_queue_per_pipe)
/ dqm->dev->kfd->shared_resources.num_pipe_per_mec;
if (!test_bit(i, dqm->dev->kfd->shared_resources.cp_queue_bitmap)) continue;
/* only acquire queues from the first MEC */ if (mec > 0) continue;
/* This situation may be hit in the future if a new HW * generation exposes more than 64 queues. If so, the * definition of res.queue_mask needs updating
*/ if (WARN_ON(i >= (sizeof(res.queue_mask)*8))) {
dev_err(dev, "Invalid queue enabled by amdgpu: %d\n", i); break;
}
/* halt_cpsch:
 * Unmap queues so the scheduler doesn't continue remaining jobs in the queue.
 * Then set dqm->sched_halt so queues don't map to runlist until unhalt_cpsch
 * is called.
 */
static int halt_cpsch(struct device_queue_manager *dqm)
{
	int ret = 0;

	dqm_lock(dqm);
	if (!dqm->sched_running) {
		/* Nothing to halt if the scheduler is not running */
		dqm_unlock(dqm);
		return 0;
	}

	WARN_ONCE(dqm->sched_halt, "Scheduling is already on halt\n");

	/*
	 * Unmap all outstanding queues first so nothing keeps executing;
	 * skip the unmap when HWS is already known to be hung.
	 */
	if (!dqm->is_hws_hang) {
		if (!dqm->dev->kfd->shared_resources.enable_mes)
			ret = unmap_queues_cpsch(dqm,
						 KFD_UNMAP_QUEUES_FILTER_ALL_QUEUES, 0,
						 USE_DEFAULT_GRACE_PERIOD, false);
		else
			ret = remove_all_kfd_queues_mes(dqm);
	}
	dqm->sched_halt = true;
	dqm_unlock(dqm);

	return ret;
}
/* unhalt_cpsch * Unset dqm->sched_halt and map queues back to runlist
*/ staticint unhalt_cpsch(struct device_queue_manager *dqm)
{ int ret = 0;
dqm_lock(dqm); if (!dqm->sched_running || !dqm->sched_halt) {
WARN_ONCE(!dqm->sched_halt, "Scheduling is not on halt.\n");
dqm_unlock(dqm); return 0;
}
dqm->sched_halt = false; if (!dqm->dev->kfd->shared_resources.enable_mes)
ret = execute_queues_cpsch(dqm,
KFD_UNMAP_QUEUES_FILTER_DYNAMIC_QUEUES,
0, USE_DEFAULT_GRACE_PERIOD); else
ret = add_all_kfd_queues_mes(dqm);
if (!dqm->dev->kfd->shared_resources.enable_mes)
unmap_queues_cpsch(dqm, KFD_UNMAP_QUEUES_FILTER_ALL_QUEUES, 0, USE_DEFAULT_GRACE_PERIOD, false); else
remove_all_kfd_queues_mes(dqm);
dqm->sched_running = false;
if (!dqm->dev->kfd->shared_resources.enable_mes)
pm_release_ib(&dqm->packet_mgr);
kfd_gtt_sa_free(dqm->dev, dqm->fence_mem); if (!dqm->dev->kfd->shared_resources.enable_mes)
pm_uninit(&dqm->packet_mgr);
kfree(dqm->detect_hang_info);
dqm->detect_hang_info = NULL;
dqm_unlock(dqm);
return 0;
}
staticint create_kernel_queue_cpsch(struct device_queue_manager *dqm, struct kernel_queue *kq, struct qcm_process_device *qpd)
{
dqm_lock(dqm); if (dqm->total_queue_count >= max_num_of_queues_per_device) {
pr_warn("Can't create new kernel queue because %d queues were already created\n",
dqm->total_queue_count);
dqm_unlock(dqm); return -EPERM;
}
/* * Unconditionally increment this counter, regardless of the queue's * type or whether the queue is active.
*/
dqm->total_queue_count++;
pr_debug("Total of %d queues are accountable so far\n",
dqm->total_queue_count);
if (q->properties.type == KFD_QUEUE_TYPE_SDMA ||
q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI)
dqm->asic_ops.init_sdma_vm(dqm, q, qpd);
q->properties.tba_addr = qpd->tba_addr;
q->properties.tma_addr = qpd->tma_addr;
q->mqd_mem_obj = mqd_mgr->allocate_mqd(mqd_mgr->dev, &q->properties); if (!q->mqd_mem_obj) {
retval = -ENOMEM; goto out_deallocate_doorbell;
}
dqm_lock(dqm); /* * Eviction state logic: mark all queues as evicted, even ones * not currently active. Restoring inactive queues later only * updates the is_evicted flag but is a no-op otherwise.
*/
q->properties.is_evicted = !!qpd->evicted;
q->properties.is_dbg_wa = qpd->pqm->process->debug_trap_enabled &&
kfd_dbg_has_cwsr_workaround(q->device);
while (*fence_addr != fence_value) { /* Fatal err detected, this response won't come */ if (amdgpu_amdkfd_is_fed(dqm->dev->adev)) return -EIO;
if (time_after(jiffies, end_jiffies)) {
dev_err(dev, "qcm fence wait loop timeout expired\n"); /* In HWS case, this is used to halt the driver thread * in order not to mess up CP states before doing * scandumps for FW debugging.
*/ while (halt_if_hws_hang)
schedule();
return -ETIME;
}
schedule();
}
return 0;
}
/* dqm->lock mutex has to be locked before calling this function */ staticint map_queues_cpsch(struct device_queue_manager *dqm)
{ struct device *dev = dqm->dev->adev->dev; int retval;
if (!dqm->sched_running || dqm->sched_halt) return 0; if (dqm->active_queue_count <= 0 || dqm->processes_count <= 0) return 0; if (dqm->active_runlist) return 0;
retval = pm_send_runlist(&dqm->packet_mgr, &dqm->queues);
pr_debug("%s sent runlist\n", __func__); if (retval) {
dev_err(dev, "failed to execute runlist\n"); return retval;
}
dqm->active_runlist = true;
/* either reset failed or we reset an unexpected queue. */ if (queue_addr != q->properties.queue_address) {
r = -ENOTRECOVERABLE; goto reset_fail;
}
set_queue_as_reset(dqm, q, &pdd->qpd);
reset_count++;
}
if (reset_count == dqm->detect_hang_count)
kfd_signal_reset_event(dqm->dev); else
r = -ENOTRECOVERABLE;
reset_fail:
dqm->detect_hang_count = 0;
return r;
}
staticbool sdma_has_hang(struct device_queue_manager *dqm)
{ int engine_start = dqm->dev->node_id * get_num_all_sdma_engines(dqm); int engine_end = engine_start + get_num_all_sdma_engines(dqm); int num_queues_per_eng = dqm->dev->kfd->device_info.num_sdma_queues_per_engine; int i, j;
for (i = engine_start; i < engine_end; i++) { for (j = 0; j < num_queues_per_eng; j++) { if (!dqm->dev->kfd2kgd->hqd_sdma_get_doorbell(dqm->dev->adev, i, j)) continue;
staticint reset_hung_queues_sdma(struct device_queue_manager *dqm)
{ int engine_start = dqm->dev->node_id * get_num_all_sdma_engines(dqm); int engine_end = engine_start + get_num_all_sdma_engines(dqm); int num_queues_per_eng = dqm->dev->kfd->device_info.num_sdma_queues_per_engine; int r = 0, i, j;
if (dqm->is_hws_hang) return -EIO;
/* Scan for hung HW queues and reset engine. */
dqm->detect_hang_count = 0; for (i = engine_start; i < engine_end; i++) { for (j = 0; j < num_queues_per_eng; j++) {
uint32_t doorbell_off =
dqm->dev->kfd2kgd->hqd_sdma_get_doorbell(dqm->dev->adev, i, j);
if (!doorbell_off) continue;
/* Reset engine and check. */ if (amdgpu_sdma_reset_engine(dqm->dev->adev, i, false) ||
dqm->dev->kfd2kgd->hqd_sdma_get_doorbell(dqm->dev->adev, i, j) ||
!set_sdma_queue_as_reset(dqm, doorbell_off)) {
r = -ENOTRECOVERABLE; goto reset_fail;
}
/* Should only expect one queue active per engine */
dqm->detect_hang_count++; break;
}
}
/* Signal process reset */ if (dqm->detect_hang_count)
kfd_signal_reset_event(dqm->dev); else
r = -ENOTRECOVERABLE;
/*
 * NOTE(review): the following disclaimer text is not C code and appears to
 * have been appended accidentally from a web page. It is preserved here but
 * commented out so the file remains parseable. Original text (German):
 *
 * Die Informationen auf dieser Webseite wurden nach bestem Wissen
 * sorgfältig zusammengestellt. Es wird jedoch weder Vollständigkeit,
 * noch Richtigkeit, noch Qualität der bereitgestellten Informationen
 * zugesichert.
 *
 * Bemerkung:
 * Die farbliche Syntaxdarstellung und die Messung sind noch experimentell.
 */