From 6ed3cffb73488b22d671c88d30061cd045417378 Mon Sep 17 00:00:00 2001
From: Mahantesh Kumbar
Date: Wed, 8 Jun 2016 17:27:49 +0530
Subject: gpu: nvgpu: ACR boot on SEC2

Add ACR/SEC2 methods to support ACR boot on the SEC2 falcon.

JIRA DNVGPU-34

Change-Id: I917be1d6c61a1c1ae61a918f50228ea00492cd50
Signed-off-by: Mahantesh Kumbar
Reviewed-on: http://git-master/r/1161122
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom
---
 drivers/gpu/nvgpu/gp106/acr_gp106.c | 1131 +++++++++++++++++++++++++++++++++++
 1 file changed, 1131 insertions(+)
 create mode 100644 drivers/gpu/nvgpu/gp106/acr_gp106.c

diff --git a/drivers/gpu/nvgpu/gp106/acr_gp106.c b/drivers/gpu/nvgpu/gp106/acr_gp106.c
new file mode 100644
index 00000000..2ea2f817
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp106/acr_gp106.c
@@ -0,0 +1,1131 @@
+/*
+ * Copyright (c) 2015-2016, NVIDIA CORPORATION. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+ * more details.
+ */
+
+#include <linux/delay.h>	/* for mdelay */
+#include <linux/firmware.h>
+#include <linux/clk.h>
+#include <linux/module.h>
+#include <linux/debugfs.h>
+#include <linux/dma-mapping.h>
+
+#include "gk20a/gk20a.h"
+#include "gk20a/pmu_gk20a.h"
+#include "gk20a/semaphore_gk20a.h"
+#include "gm20b/hw_pwr_gm20b.h"
+#include "gm206/acr_gm206.h"
+#include "gm20b/acr_gm20b.h"
+#include "gm206/pmu_gm206.h"
+#include "sec2_gp106.h"
+
+/*Defines*/
+#define gp106_dbg_pmu(fmt, arg...) \
+	gk20a_dbg(gpu_dbg_pmu, fmt, ##arg)
+
+typedef int (*get_ucode_details)(struct gk20a *g,
+		struct flcn_ucode_img_v1 *udata);
+
+/* Both size and address of WPR need to be 128K-aligned */
+#define WPR_ALIGNMENT		0x20000
+#define GP106_DGPU_NONWPR	0x10000000 /* start from 256MB location at VIDMEM */
+#define GP106_DGPU_WPR		0x20000000
+#define DGPU_WPR_SIZE		0x100000
+
+/*Externs*/
+
+/*Forwards*/
+static int pmu_ucode_details(struct gk20a *g, struct flcn_ucode_img_v1 *p_img);
+static int fecs_ucode_details(struct gk20a *g,
+		struct flcn_ucode_img_v1 *p_img);
+static int gpccs_ucode_details(struct gk20a *g,
+		struct flcn_ucode_img_v1 *p_img);
+static int gp106_bootstrap_hs_flcn(struct gk20a *g);
+
+static int lsfm_discover_ucode_images(struct gk20a *g,
+		struct ls_flcn_mgr_v1 *plsfm);
+static int lsfm_add_ucode_img(struct gk20a *g, struct ls_flcn_mgr_v1 *plsfm,
+		struct flcn_ucode_img_v1 *ucode_image, u32 falcon_id);
+static void lsfm_free_ucode_img_res(struct flcn_ucode_img_v1 *p_img);
+static void lsfm_free_nonpmu_ucode_img_res(struct flcn_ucode_img_v1 *p_img);
+static int lsf_gen_wpr_requirements(struct gk20a *g,
+		struct ls_flcn_mgr_v1 *plsfm);
+static void lsfm_init_wpr_contents(struct gk20a *g,
+		struct ls_flcn_mgr_v1 *plsfm, struct mem_desc *nonwpr);
+static void free_acr_resources(struct gk20a *g, struct ls_flcn_mgr_v1 *plsfm);
+static int gp106_pmu_populate_loader_cfg(struct gk20a *g,
+		void *lsfm, u32 *p_bl_gen_desc_size);
+static int gp106_flcn_populate_bl_dmem_desc(struct gk20a *g,
+		void *lsfm, u32 *p_bl_gen_desc_size, u32 falconid);
+static int gp106_prepare_ucode_blob(struct gk20a *g);
+
+/*Globals*/
+static get_ucode_details pmu_acr_supp_ucode_list[] = {
+	pmu_ucode_details,
+	fecs_ucode_details,
+	gpccs_ucode_details,
+};
+
+void gp106_wpr_info(struct gk20a *g, struct wpr_carveout_info *inf)
+{
+	inf->wpr_base = GP106_DGPU_WPR;
+	inf->nonwpr_base = GP106_DGPU_NONWPR;
+	inf->size = DGPU_WPR_SIZE;
+}
+
+static void flcn64_set_dma(struct falc_u64 *dma_addr, u64 value)
+{
+	dma_addr->lo |= u64_lo32(value);
+	dma_addr->hi |= u64_hi32(value);
+}
+
+int gp106_alloc_blob_space(struct gk20a *g,
+	size_t size, struct mem_desc *mem)
+{
+	int err = 0;
+	struct wpr_carveout_info wpr_inf;
+
+	g->ops.pmu.get_wpr(g, &wpr_inf);
+
+	mem->aperture = APERTURE_VIDMEM;
+	mem->sgt = kzalloc(sizeof(*mem->sgt), GFP_KERNEL);
+	if (!mem->sgt) {
+		gk20a_err(dev_from_gk20a(g), "failed to allocate memory\n");
+		return -ENOMEM;
+	}
+
+	err = sg_alloc_table(mem->sgt, 1, GFP_KERNEL);
+	if (err) {
+		gk20a_err(dev_from_gk20a(g), "failed to allocate sg_table\n");
+		goto free_sgt;
+	}
+
+	sg_dma_address(mem->sgt->sgl) = wpr_inf.nonwpr_base;
+
+	return err;
+
+free_sgt:
+	gk20a_free_sgtable(&mem->sgt);
+	return err;
+}
+
+void gp106_init_secure_pmu(struct gpu_ops *gops)
+{
+	gops->pmu.prepare_ucode = gp106_prepare_ucode_blob;
+	gops->pmu.pmu_setup_hw_and_bootstrap = gp106_bootstrap_hs_flcn;
+	gops->pmu.is_lazy_bootstrap = gm206_is_lazy_bootstrap;
+	gops->pmu.is_priv_load = gm206_is_priv_load;
+	gops->pmu.get_wpr = gp106_wpr_info;
+	gops->pmu.alloc_blob_space = gp106_alloc_blob_space;
+	gops->pmu.pmu_populate_loader_cfg = gp106_pmu_populate_loader_cfg;
+	gops->pmu.flcn_populate_bl_dmem_desc = gp106_flcn_populate_bl_dmem_desc;
+	gops->pmu.falcon_wait_for_halt = sec2_wait_for_halt;
+	gops->pmu.falcon_clear_halt_interrupt_status =
+		sec2_clear_halt_interrupt_status;
+	gops->pmu.init_falcon_setup_hw = init_sec2_setup_hw1;
+}
+/* TODO - check if any free blob res needed*/
+
+int pmu_ucode_details(struct gk20a *g, struct flcn_ucode_img_v1 *p_img)
+{
+	const struct firmware *pmu_fw, *pmu_desc, *pmu_sig;
+	struct pmu_gk20a *pmu = &g->pmu;
+	struct lsf_ucode_desc_v1 *lsf_desc;
+	int err;
+
+	gp106_dbg_pmu("requesting PMU ucode in gp106\n");
+	pmu_fw = gk20a_request_firmware(g, GM20B_PMU_UCODE_IMAGE);
+	if (!pmu_fw) {
+		gk20a_err(dev_from_gk20a(g), "failed to load pmu ucode!!");
+		return -ENOENT;
+	}
+	g->acr.pmu_fw = pmu_fw;
+	gp106_dbg_pmu("Loaded PMU ucode for blob preparation");
+
+	gp106_dbg_pmu("requesting PMU ucode desc in GM20B\n");
+	pmu_desc = gk20a_request_firmware(g, GM20B_PMU_UCODE_DESC);
+	if (!pmu_desc) {
+		gk20a_err(dev_from_gk20a(g), "failed to load pmu ucode desc!!");
+		err = -ENOENT;
+		goto release_img_fw;
+	}
+	pmu_sig = gk20a_request_firmware(g, GM20B_PMU_UCODE_SIG);
+	if (!pmu_sig) {
+		gk20a_err(dev_from_gk20a(g), "failed to load pmu sig!!");
+		err = -ENOENT;
+		goto release_desc;
+	}
+	pmu->desc_v1 = (struct pmu_ucode_desc_v1 *)pmu_desc->data;
+	pmu->ucode_image = (u32 *)pmu_fw->data;
+	g->acr.pmu_desc = pmu_desc;
+
+	err = gk20a_init_pmu(pmu);
+	if (err) {
+		gp106_dbg_pmu("failed to set function pointers\n");
+		goto release_desc;
+	}
+
+	lsf_desc = kzalloc(sizeof(struct lsf_ucode_desc_v1), GFP_KERNEL);
+	if (!lsf_desc) {
+		err = -ENOMEM;
+		goto release_sig;
+	}
+	memcpy(lsf_desc, (void *)pmu_sig->data,
+		sizeof(struct lsf_ucode_desc_v1));
+	lsf_desc->falcon_id = LSF_FALCON_ID_PMU;
+
+	p_img->desc = pmu->desc_v1;
+	p_img->data = pmu->ucode_image;
+	p_img->data_size = pmu->desc_v1->app_start_offset +
+		pmu->desc_v1->app_size;
+	p_img->fw_ver = NULL;
+	p_img->header = NULL;
+	p_img->lsf_desc = (struct lsf_ucode_desc_v1 *)lsf_desc;
+	gp106_dbg_pmu("requesting PMU ucode in GM20B exit\n");
+
+	release_firmware(pmu_sig);
+	return 0;
+release_sig:
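+	/* Error unwind: each label below releases one more of the
+	 * firmware images requested above, newest first. */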
+ release_firmware(pmu_sig); +release_desc: + release_firmware(pmu_desc); +release_img_fw: + release_firmware(pmu_fw); + return err; +} + +int fecs_ucode_details(struct gk20a *g, struct flcn_ucode_img_v1 *p_img) +{ + struct lsf_ucode_desc_v1 *lsf_desc; + const struct firmware *fecs_sig; + int err; + + fecs_sig = gk20a_request_firmware(g, GM20B_FECS_UCODE_SIG); + if (!fecs_sig) { + gk20a_err(dev_from_gk20a(g), "failed to load fecs sig"); + return -ENOENT; + } + lsf_desc = kzalloc(sizeof(struct lsf_ucode_desc_v1), GFP_KERNEL); + if (!lsf_desc) { + err = -ENOMEM; + goto rel_sig; + } + memcpy(lsf_desc, (void *)fecs_sig->data, sizeof(struct lsf_ucode_desc_v1)); + lsf_desc->falcon_id = LSF_FALCON_ID_FECS; + + p_img->desc = kzalloc(sizeof(struct pmu_ucode_desc_v1), GFP_KERNEL); + if (p_img->desc == NULL) { + err = -ENOMEM; + goto free_lsf_desc; + } + + p_img->desc->bootloader_start_offset = + g->ctxsw_ucode_info.fecs.boot.offset; + p_img->desc->bootloader_size = + ALIGN(g->ctxsw_ucode_info.fecs.boot.size, 256); + p_img->desc->bootloader_imem_offset = + g->ctxsw_ucode_info.fecs.boot_imem_offset; + p_img->desc->bootloader_entry_point = + g->ctxsw_ucode_info.fecs.boot_entry; + + p_img->desc->image_size = + ALIGN(g->ctxsw_ucode_info.fecs.boot.size, 256) + + ALIGN(g->ctxsw_ucode_info.fecs.code.size, 256) + + ALIGN(g->ctxsw_ucode_info.fecs.data.size, 256); + p_img->desc->app_size = ALIGN(g->ctxsw_ucode_info.fecs.code.size, 256) + + ALIGN(g->ctxsw_ucode_info.fecs.data.size, 256); + p_img->desc->app_start_offset = g->ctxsw_ucode_info.fecs.code.offset; + p_img->desc->app_imem_offset = 0; + p_img->desc->app_imem_entry = 0; + p_img->desc->app_dmem_offset = 0; + p_img->desc->app_resident_code_offset = 0; + p_img->desc->app_resident_code_size = + g->ctxsw_ucode_info.fecs.code.size; + p_img->desc->app_resident_data_offset = + g->ctxsw_ucode_info.fecs.data.offset - + g->ctxsw_ucode_info.fecs.code.offset; + p_img->desc->app_resident_data_size = + g->ctxsw_ucode_info.fecs.data.size; + p_img->data = g->ctxsw_ucode_info.surface_desc.cpu_va; + p_img->data_size = p_img->desc->image_size; + + p_img->fw_ver = NULL; + p_img->header = NULL; + p_img->lsf_desc = (struct lsf_ucode_desc_v1 *)lsf_desc; + gp106_dbg_pmu("fecs fw loaded\n"); + release_firmware(fecs_sig); + return 0; +free_lsf_desc: + kfree(lsf_desc); +rel_sig: + release_firmware(fecs_sig); + return err; +} +int gpccs_ucode_details(struct gk20a *g, struct flcn_ucode_img_v1 *p_img) +{ + struct lsf_ucode_desc_v1 *lsf_desc; + const struct firmware *gpccs_sig; + int err; + + if (g->ops.securegpccs == false) + return -ENOENT; + + gpccs_sig = gk20a_request_firmware(g, T18x_GPCCS_UCODE_SIG); + if (!gpccs_sig) { + gk20a_err(dev_from_gk20a(g), "failed to load gpccs sig"); + return -ENOENT; + } + lsf_desc = kzalloc(sizeof(struct lsf_ucode_desc_v1), GFP_KERNEL); + if (!lsf_desc) { + err = -ENOMEM; + goto rel_sig; + } + memcpy(lsf_desc, (void *)gpccs_sig->data, + sizeof(struct lsf_ucode_desc_v1)); + lsf_desc->falcon_id = LSF_FALCON_ID_GPCCS; + + p_img->desc = kzalloc(sizeof(struct pmu_ucode_desc_v1), GFP_KERNEL); + if (p_img->desc == NULL) { + err = -ENOMEM; + goto free_lsf_desc; + } + + p_img->desc->bootloader_start_offset = + 0; + p_img->desc->bootloader_size = + ALIGN(g->ctxsw_ucode_info.gpccs.boot.size, 256); + p_img->desc->bootloader_imem_offset = + g->ctxsw_ucode_info.gpccs.boot_imem_offset; + p_img->desc->bootloader_entry_point = + g->ctxsw_ucode_info.gpccs.boot_entry; + + p_img->desc->image_size = + ALIGN(g->ctxsw_ucode_info.gpccs.boot.size, 256) + + 
ALIGN(g->ctxsw_ucode_info.gpccs.code.size, 256) + + ALIGN(g->ctxsw_ucode_info.gpccs.data.size, 256); + p_img->desc->app_size = ALIGN(g->ctxsw_ucode_info.gpccs.code.size, 256) + + ALIGN(g->ctxsw_ucode_info.gpccs.data.size, 256); + p_img->desc->app_start_offset = p_img->desc->bootloader_size; + p_img->desc->app_imem_offset = 0; + p_img->desc->app_imem_entry = 0; + p_img->desc->app_dmem_offset = 0; + p_img->desc->app_resident_code_offset = 0; + p_img->desc->app_resident_code_size = + ALIGN(g->ctxsw_ucode_info.gpccs.code.size, 256); + p_img->desc->app_resident_data_offset = + ALIGN(g->ctxsw_ucode_info.gpccs.data.offset, 256) - + ALIGN(g->ctxsw_ucode_info.gpccs.code.offset, 256); + p_img->desc->app_resident_data_size = + ALIGN(g->ctxsw_ucode_info.gpccs.data.size, 256); + p_img->data = (u32 *)((u8 *)g->ctxsw_ucode_info.surface_desc.cpu_va + + g->ctxsw_ucode_info.gpccs.boot.offset); + p_img->data_size = ALIGN(p_img->desc->image_size, 256); + p_img->fw_ver = NULL; + p_img->header = NULL; + p_img->lsf_desc = (struct lsf_ucode_desc_v1 *)lsf_desc; + gp106_dbg_pmu("gpccs fw loaded\n"); + release_firmware(gpccs_sig); + return 0; +free_lsf_desc: + kfree(lsf_desc); +rel_sig: + release_firmware(gpccs_sig); + return err; +} + +int gp106_prepare_ucode_blob(struct gk20a *g) +{ + + int err; + struct ls_flcn_mgr_v1 lsfm_l, *plsfm; + struct pmu_gk20a *pmu = &g->pmu; + struct wpr_carveout_info wpr_inf; + + if (g->acr.ucode_blob.cpu_va) { + /*Recovery case, we do not need to form + non WPR blob of ucodes*/ + err = gk20a_init_pmu(pmu); + if (err) { + gp106_dbg_pmu("failed to set function pointers\n"); + return err; + } + return 0; + } + plsfm = &lsfm_l; + memset((void *)plsfm, 0, sizeof(struct ls_flcn_mgr_v1)); + gp106_dbg_pmu("fetching GMMU regs\n"); + gm20b_mm_mmu_vpr_info_fetch(g); + gr_gk20a_init_ctxsw_ucode(g); + + if (g->ops.fb.dump_vpr_wpr_info) + g->ops.fb.dump_vpr_wpr_info(g); + + g->ops.pmu.get_wpr(g, &wpr_inf); + gp106_dbg_pmu("wpr carveout base:%llx\n", (wpr_inf.wpr_base)); + gp106_dbg_pmu("wpr carveout size :%x\n", (u32)wpr_inf.size); + + /* Discover all managed falcons*/ + err = lsfm_discover_ucode_images(g, plsfm); + gp106_dbg_pmu(" Managed Falcon cnt %d\n", plsfm->managed_flcn_cnt); + if (err) + goto exit_err; + + if (plsfm->managed_flcn_cnt && !g->acr.ucode_blob.cpu_va) { + /* Generate WPR requirements*/ + err = lsf_gen_wpr_requirements(g, plsfm); + if (err) + goto exit_err; + + /*Alloc memory to hold ucode blob contents*/ + err = g->ops.pmu.alloc_blob_space(g, plsfm->wpr_size + ,&g->acr.ucode_blob); + if (err) + goto exit_err; + + gp106_dbg_pmu("managed LS falcon %d, WPR size %d bytes.\n", + plsfm->managed_flcn_cnt, plsfm->wpr_size); + + lsfm_init_wpr_contents(g, plsfm, &g->acr.ucode_blob); + } else { + gp106_dbg_pmu("LSFM is managing no falcons.\n"); + } + gp106_dbg_pmu("prepare ucode blob return 0\n"); + free_acr_resources(g, plsfm); + + exit_err: + return err; +} + +static u8 lsfm_falcon_disabled(struct gk20a *g, struct ls_flcn_mgr_v1 *plsfm, + u32 falcon_id) +{ + return (plsfm->disable_mask >> falcon_id) & 0x1; +} + +/* Discover all managed falcon ucode images */ +static int lsfm_discover_ucode_images(struct gk20a *g, + struct ls_flcn_mgr_v1 *plsfm) +{ + struct pmu_gk20a *pmu = &g->pmu; + struct flcn_ucode_img_v1 ucode_img; + u32 falcon_id; + u32 i; + int status; + + /* LSFM requires a secure PMU, discover it first.*/ + /* Obtain the PMU ucode image and add it to the list if required*/ + memset(&ucode_img, 0, sizeof(ucode_img)); + status = pmu_ucode_details(g, &ucode_img); + if (status == 0) 
{
+		if (ucode_img.lsf_desc != NULL) {
+			/* The falcon_id is formed by grabbing the static base
+			 * falcon_id from the image and adding the
+			 * engine-designated falcon instance.*/
+			pmu->pmu_mode |= PMU_SECURE_MODE;
+			falcon_id = ucode_img.lsf_desc->falcon_id +
+				ucode_img.flcn_inst;
+
+			if (!lsfm_falcon_disabled(g, plsfm, falcon_id)) {
+				pmu->falcon_id = falcon_id;
+				if (lsfm_add_ucode_img(g, plsfm, &ucode_img,
+					pmu->falcon_id) == 0)
+					pmu->pmu_mode |= PMU_LSFM_MANAGED;
+
+				plsfm->managed_flcn_cnt++;
+			} else {
+				gp106_dbg_pmu("id not managed %d\n",
+					ucode_img.lsf_desc->falcon_id);
+			}
+		}
+
+		/*Free any ucode image resources if not managing this falcon*/
+		if (!(pmu->pmu_mode & PMU_LSFM_MANAGED)) {
+			gp106_dbg_pmu("pmu is not LSFM managed\n");
+			lsfm_free_ucode_img_res(&ucode_img);
+		}
+	}
+
+	/* Enumerate all constructed falcon objects, as we need the
+	 ucode image info and total falcon count.*/
+
+	/*0th index is always PMU, which is already handled in the earlier
+	if condition*/
+	for (i = 1; i < (MAX_SUPPORTED_LSFM); i++) {
+		memset(&ucode_img, 0, sizeof(ucode_img));
+		if (pmu_acr_supp_ucode_list[i](g, &ucode_img) == 0) {
+			if (ucode_img.lsf_desc != NULL) {
+				/* We have engine sigs, ensure that this falcon
+				is aware of the secure mode expectations
+				(ACR status)*/
+
+				/* falcon_id is formed by grabbing the static
+				base falcon_id from the image and adding the
+				engine-designated falcon instance. */
+				falcon_id = ucode_img.lsf_desc->falcon_id +
+					ucode_img.flcn_inst;
+
+				if (!lsfm_falcon_disabled(g, plsfm,
+					falcon_id)) {
+					/* Do not manage non-FB ucode*/
+					if (lsfm_add_ucode_img(g,
+						plsfm, &ucode_img, falcon_id)
+						== 0)
+						plsfm->managed_flcn_cnt++;
+				} else {
+					gp106_dbg_pmu("not managed %d\n",
+						ucode_img.lsf_desc->falcon_id);
+					lsfm_free_nonpmu_ucode_img_res(
+						&ucode_img);
+				}
+			}
+		} else {
+			/* Consumed all available falcon objects */
+			gp106_dbg_pmu("Done checking for ucodes %d\n", i);
+			break;
+		}
+	}
+	return 0;
+}
+
+static int gp106_pmu_populate_loader_cfg(struct gk20a *g,
+	void *lsfm, u32 *p_bl_gen_desc_size)
+{
+	struct wpr_carveout_info wpr_inf;
+	struct pmu_gk20a *pmu = &g->pmu;
+	struct lsfm_managed_ucode_img_v2 *p_lsfm =
+		(struct lsfm_managed_ucode_img_v2 *)lsfm;
+	struct flcn_ucode_img_v1 *p_img = &(p_lsfm->ucode_img);
+	struct loader_config_v1 *ldr_cfg =
+		&(p_lsfm->bl_gen_desc.loader_cfg_v1);
+	u64 addr_base;
+	struct pmu_ucode_desc_v1 *desc;
+	u64 addr_code, addr_data;
+	u32 addr_args;
+
+	if (p_img->desc == NULL) /*This means it's a header-based ucode,
+				  and so we do not fill the BL gen desc
+				  structure*/
+		return -EINVAL;
+	desc = p_img->desc;
+	/*
+	 Calculate physical and virtual addresses for various portions of
+	 the PMU ucode image, i.e. the 32-bit addresses for the application
+	 code, application data, and bootloader code. These values are all
+	 based on IM_BASE; each is the low 32 bits of the physical address
+	 of its respective segment.
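+	 Here addr_base becomes the absolute FB address of this falcon's
+	 ucode inside the WPR carveout: lsb_header.ucode_off plus the WPR
+	 base reported by get_wpr().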
+	 */
+	addr_base = p_lsfm->lsb_header.ucode_off;
+	g->ops.pmu.get_wpr(g, &wpr_inf);
+	addr_base += wpr_inf.wpr_base;
+
+	gp106_dbg_pmu("pmu loader cfg u32 addrbase %x\n", (u32)addr_base);
+	/*From linux*/
+	addr_code = u64_lo32((addr_base +
+			desc->app_start_offset +
+			desc->app_resident_code_offset));
+	gp106_dbg_pmu("app start %d app res code off %d\n",
+		desc->app_start_offset, desc->app_resident_code_offset);
+	addr_data = u64_lo32((addr_base +
+			desc->app_start_offset +
+			desc->app_resident_data_offset));
+	gp106_dbg_pmu("app res data offset %d\n",
+		desc->app_resident_data_offset);
+	gp106_dbg_pmu("bl start off %d\n", desc->bootloader_start_offset);
+
+	addr_args = ((pwr_falcon_hwcfg_dmem_size_v(
+			gk20a_readl(g, pwr_falcon_hwcfg_r())))
+			<< GK20A_PMU_DMEM_BLKSIZE2);
+
+	addr_args -= g->ops.pmu_ver.get_pmu_cmdline_args_size(pmu);
+
+	gp106_dbg_pmu("addr_args %x\n", addr_args);
+
+	/* Populate the loader_config state*/
+	ldr_cfg->dma_idx = GK20A_PMU_DMAIDX_UCODE;
+	flcn64_set_dma(&ldr_cfg->code_dma_base, addr_code);
+	ldr_cfg->code_size_total = desc->app_size;
+	ldr_cfg->code_size_to_load = desc->app_resident_code_size;
+	ldr_cfg->code_entry_point = desc->app_imem_entry;
+	flcn64_set_dma(&ldr_cfg->data_dma_base, addr_data);
+	ldr_cfg->data_size = desc->app_resident_data_size;
+	flcn64_set_dma(&ldr_cfg->overlay_dma_base, addr_code);
+
+	/* Update the argc/argv members*/
+	ldr_cfg->argc = 1;
+	ldr_cfg->argv = addr_args;
+
+	*p_bl_gen_desc_size = sizeof(struct loader_config_v1);
+	g->acr.pmu_args = addr_args;
+	return 0;
+}
+
+static int gp106_flcn_populate_bl_dmem_desc(struct gk20a *g,
+	void *lsfm, u32 *p_bl_gen_desc_size, u32 falconid)
+{
+	struct wpr_carveout_info wpr_inf;
+	struct lsfm_managed_ucode_img_v2 *p_lsfm =
+		(struct lsfm_managed_ucode_img_v2 *)lsfm;
+	struct flcn_ucode_img_v1 *p_img = &(p_lsfm->ucode_img);
+	struct flcn_bl_dmem_desc_v1 *ldr_cfg =
+		&(p_lsfm->bl_gen_desc.bl_dmem_desc_v1);
+	u64 addr_base;
+	struct pmu_ucode_desc_v1 *desc;
+	u64 addr_code, addr_data;
+
+	if (p_img->desc == NULL) /*This means it's a header-based ucode,
+				  and so we do not fill the BL gen desc
+				  structure*/
+		return -EINVAL;
+	desc = p_img->desc;
+
+	/*
+	 As above: calculate the 32-bit addresses for the application code,
+	 application data, and bootloader code, each taken from the low
+	 32 bits of the physical address of its respective segment.
+ */ + addr_base = p_lsfm->lsb_header.ucode_off; + g->ops.pmu.get_wpr(g, &wpr_inf); + addr_base += (wpr_inf.wpr_base); + + gp106_dbg_pmu("gen loader cfg %x u32 addrbase %x ID\n", (u32)addr_base, + p_lsfm->wpr_header.falcon_id); + addr_code = u64_lo32((addr_base + + desc->app_start_offset + + desc->app_resident_code_offset) ); + addr_data = u64_lo32((addr_base + + desc->app_start_offset + + desc->app_resident_data_offset) ); + + gp106_dbg_pmu("gen cfg %x u32 addrcode %x & data %x load offset %xID\n", + (u32)addr_code, (u32)addr_data, desc->bootloader_start_offset, + p_lsfm->wpr_header.falcon_id); + + /* Populate the LOADER_CONFIG state */ + memset((void *) ldr_cfg, 0, sizeof(struct flcn_bl_dmem_desc_v1)); + ldr_cfg->ctx_dma = GK20A_PMU_DMAIDX_UCODE; + flcn64_set_dma(&ldr_cfg->code_dma_base, addr_code); + ldr_cfg->non_sec_code_size = desc->app_resident_code_size; + flcn64_set_dma(&ldr_cfg->data_dma_base, addr_data); + ldr_cfg->data_size = desc->app_resident_data_size; + ldr_cfg->code_entry_point = desc->app_imem_entry; + + *p_bl_gen_desc_size = sizeof(struct flcn_bl_dmem_desc_v1); + return 0; +} + +/* Populate falcon boot loader generic desc.*/ +static int lsfm_fill_flcn_bl_gen_desc(struct gk20a *g, + struct lsfm_managed_ucode_img_v2 *pnode) +{ + + struct pmu_gk20a *pmu = &g->pmu; + if (pnode->wpr_header.falcon_id != pmu->falcon_id) { + gp106_dbg_pmu("non pmu. write flcn bl gen desc\n"); + g->ops.pmu.flcn_populate_bl_dmem_desc(g, + pnode, &pnode->bl_gen_desc_size, + pnode->wpr_header.falcon_id); + return 0; + } + + if (pmu->pmu_mode & PMU_LSFM_MANAGED) { + gp106_dbg_pmu("pmu write flcn bl gen desc\n"); + if (pnode->wpr_header.falcon_id == pmu->falcon_id) + return g->ops.pmu.pmu_populate_loader_cfg(g, pnode, + &pnode->bl_gen_desc_size); + } + + /* Failed to find the falcon requested. */ + return -ENOENT; +} + +/* Initialize WPR contents */ +static void lsfm_init_wpr_contents(struct gk20a *g, + struct ls_flcn_mgr_v1 *plsfm, struct mem_desc *ucode) +{ + struct lsfm_managed_ucode_img_v2 *pnode = plsfm->ucode_img_list; + u32 i; + + /* The WPR array is at the base of the WPR */ + pnode = plsfm->ucode_img_list; + i = 0; + + /* + * Walk the managed falcons, flush WPR and LSB headers to FB. + * flush any bl args to the storage area relative to the + * ucode image (appended on the end as a DMEM area). 
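+	 * The blob layout being flushed is: an array of WPR headers at
+	 * the base (terminated by LSF_FALCON_ID_INVALID), then for each
+	 * falcon an LSB header, the ucode image, and the BL gen desc.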
+ */ + while (pnode) { + /* Flush WPR header to memory*/ + gk20a_mem_wr_n(g, ucode, i * sizeof(pnode->wpr_header), + &pnode->wpr_header, sizeof(pnode->wpr_header)); + + gp106_dbg_pmu("wpr header"); + gp106_dbg_pmu("falconid :%d", + pnode->wpr_header.falcon_id); + gp106_dbg_pmu("lsb_offset :%x", + pnode->wpr_header.lsb_offset); + gp106_dbg_pmu("bootstrap_owner :%d", + pnode->wpr_header.bootstrap_owner); + gp106_dbg_pmu("lazy_bootstrap :%d", + pnode->wpr_header.lazy_bootstrap); + gp106_dbg_pmu("status :%d", + pnode->wpr_header.status); + + /*Flush LSB header to memory*/ + gk20a_mem_wr_n(g, ucode, pnode->wpr_header.lsb_offset, + &pnode->lsb_header, sizeof(pnode->lsb_header)); + + gp106_dbg_pmu("lsb header"); + gp106_dbg_pmu("ucode_off :%x", + pnode->lsb_header.ucode_off); + gp106_dbg_pmu("ucode_size :%x", + pnode->lsb_header.ucode_size); + gp106_dbg_pmu("data_size :%x", + pnode->lsb_header.data_size); + gp106_dbg_pmu("bl_code_size :%x", + pnode->lsb_header.bl_code_size); + gp106_dbg_pmu("bl_imem_off :%x", + pnode->lsb_header.bl_imem_off); + gp106_dbg_pmu("bl_data_off :%x", + pnode->lsb_header.bl_data_off); + gp106_dbg_pmu("bl_data_size :%x", + pnode->lsb_header.bl_data_size); + gp106_dbg_pmu("app_code_off :%x", + pnode->lsb_header.app_code_off); + gp106_dbg_pmu("app_code_size :%x", + pnode->lsb_header.app_code_size); + gp106_dbg_pmu("app_data_off :%x", + pnode->lsb_header.app_data_off); + gp106_dbg_pmu("app_data_size :%x", + pnode->lsb_header.app_data_size); + gp106_dbg_pmu("flags :%x", + pnode->lsb_header.flags); + + /*If this falcon has a boot loader and related args, + * flush them.*/ + if (!pnode->ucode_img.header) { + /*Populate gen bl and flush to memory*/ + lsfm_fill_flcn_bl_gen_desc(g, pnode); + gk20a_mem_wr_n(g, ucode, + pnode->lsb_header.bl_data_off, + &pnode->bl_gen_desc, + pnode->bl_gen_desc_size); + } + /*Copying of ucode*/ + gk20a_mem_wr_n(g, ucode, pnode->lsb_header.ucode_off, + pnode->ucode_img.data, + pnode->ucode_img.data_size); + pnode = pnode->next; + i++; + } + + /* Tag the terminator WPR header with an invalid falcon ID. */ + gk20a_mem_wr32(g, ucode, + plsfm->managed_flcn_cnt * sizeof(struct lsf_wpr_header) + + offsetof(struct lsf_wpr_header, falcon_id), + LSF_FALCON_ID_INVALID); +} + +/*! + * lsfm_parse_no_loader_ucode: parses UCODE header of falcon + * + * @param[in] p_ucodehdr : UCODE header + * @param[out] lsb_hdr : updates values in LSB header + * + * @return 0 + */ +static int lsfm_parse_no_loader_ucode(u32 *p_ucodehdr, + struct lsf_lsb_header_v1 *lsb_hdr) +{ + + u32 code_size = 0; + u32 data_size = 0; + u32 i = 0; + u32 total_apps = p_ucodehdr[FLCN_NL_UCODE_HDR_NUM_APPS_IND]; + + /* Lets calculate code size*/ + code_size += p_ucodehdr[FLCN_NL_UCODE_HDR_OS_CODE_SIZE_IND]; + for (i = 0; i < total_apps; i++) { + code_size += p_ucodehdr[FLCN_NL_UCODE_HDR_APP_CODE_SIZE_IND + (total_apps, i)]; + } + code_size += p_ucodehdr[FLCN_NL_UCODE_HDR_OS_OVL_SIZE_IND(total_apps)]; + + /* Calculate data size*/ + data_size += p_ucodehdr[FLCN_NL_UCODE_HDR_OS_DATA_SIZE_IND]; + for (i = 0; i < total_apps; i++) { + data_size += p_ucodehdr[FLCN_NL_UCODE_HDR_APP_DATA_SIZE_IND + (total_apps, i)]; + } + + lsb_hdr->ucode_size = code_size; + lsb_hdr->data_size = data_size; + lsb_hdr->bl_code_size = p_ucodehdr[FLCN_NL_UCODE_HDR_OS_CODE_SIZE_IND]; + lsb_hdr->bl_imem_off = 0; + lsb_hdr->bl_data_off = p_ucodehdr[FLCN_NL_UCODE_HDR_OS_DATA_OFF_IND]; + lsb_hdr->bl_data_size = p_ucodehdr[FLCN_NL_UCODE_HDR_OS_DATA_SIZE_IND]; + return 0; +} + +/*! 
+ * @brief lsfm_fill_static_lsb_hdr_info
+ * Populate static LSB header information using the provided ucode image
+ */
+static void lsfm_fill_static_lsb_hdr_info(struct gk20a *g,
+	u32 falcon_id, struct lsfm_managed_ucode_img_v2 *pnode)
+{
+	struct pmu_gk20a *pmu = &g->pmu;
+	u32 full_app_size = 0;
+	u32 data = 0;
+
+	if (pnode->ucode_img.lsf_desc)
+		memcpy(&pnode->lsb_header.signature, pnode->ucode_img.lsf_desc,
+			sizeof(struct lsf_ucode_desc_v1));
+	pnode->lsb_header.ucode_size = pnode->ucode_img.data_size;
+
+	/* The remainder of the LSB depends on the loader usage */
+	if (pnode->ucode_img.header) {
+		/* Does not use a loader */
+		pnode->lsb_header.data_size = 0;
+		pnode->lsb_header.bl_code_size = 0;
+		pnode->lsb_header.bl_data_off = 0;
+		pnode->lsb_header.bl_data_size = 0;
+
+		lsfm_parse_no_loader_ucode(pnode->ucode_img.header,
+			&(pnode->lsb_header));
+
+		/* Load the first 256 bytes of IMEM. */
+		/* Set LOAD_CODE_AT_0 and DMACTL_REQ_CTX.
+		 True for all method-based falcons */
+		data = NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0_TRUE |
+			NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_TRUE;
+		pnode->lsb_header.flags = data;
+	} else {
+		/* Uses a loader, i.e. it has a desc */
+		pnode->lsb_header.data_size = 0;
+
+		/* The loader code size is already aligned (padded) such that
+		 the code following it is aligned, but the size in the image
+		 desc is not; bloat it up to a 256-byte alignment. */
+		pnode->lsb_header.bl_code_size = ALIGN(
+			pnode->ucode_img.desc->bootloader_size,
+			LSF_BL_CODE_SIZE_ALIGNMENT);
+		full_app_size = ALIGN(pnode->ucode_img.desc->app_size,
+			LSF_BL_CODE_SIZE_ALIGNMENT) +
+			pnode->lsb_header.bl_code_size;
+		pnode->lsb_header.ucode_size = ALIGN(
+			pnode->ucode_img.desc->app_resident_data_offset,
+			LSF_BL_CODE_SIZE_ALIGNMENT) +
+			pnode->lsb_header.bl_code_size;
+		pnode->lsb_header.data_size = full_app_size -
+			pnode->lsb_header.ucode_size;
+		/* Though the BL is located at offset 0 of the image, the VA
+		 is different, to make sure that it doesn't collide with the
+		 actual OS VA range */
+		pnode->lsb_header.bl_imem_off =
+			pnode->ucode_img.desc->bootloader_imem_offset;
+
+		/* TODO: OBJFLCN should export properties from which the
+		 flags below should be populated.*/
+		pnode->lsb_header.flags = 0;
+
+		if (falcon_id == pmu->falcon_id) {
+			data = NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_TRUE;
+			pnode->lsb_header.flags = data;
+		}
+
+		if (g->ops.pmu.is_priv_load(falcon_id))
+			pnode->lsb_header.flags |=
+				NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_TRUE;
+	}
+}
+
+/* Adds a ucode image to the list of managed ucode images.
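+   A managed node carries its own copy of the image info, plus the WPR
+   and LSB headers that lsfm_init_wpr_contents() later flushes into the
+   blob.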
*/ +static int lsfm_add_ucode_img(struct gk20a *g, struct ls_flcn_mgr_v1 *plsfm, + struct flcn_ucode_img_v1 *ucode_image, u32 falcon_id) +{ + struct lsfm_managed_ucode_img_v2 *pnode; + + pnode = kzalloc(sizeof(struct lsfm_managed_ucode_img_v2), GFP_KERNEL); + if (pnode == NULL) + return -ENOMEM; + + /* Keep a copy of the ucode image info locally */ + memcpy(&pnode->ucode_img, ucode_image, sizeof(struct flcn_ucode_img_v1)); + + /* Fill in static WPR header info*/ + pnode->wpr_header.falcon_id = falcon_id; + pnode->wpr_header.bootstrap_owner = 0x07; //LSF_BOOTSTRAP_OWNER_DEFAULT; + pnode->wpr_header.status = LSF_IMAGE_STATUS_COPY; + + pnode->wpr_header.lazy_bootstrap = + g->ops.pmu.is_lazy_bootstrap(falcon_id); + + /*TODO to check if PDB_PROP_FLCN_LAZY_BOOTSTRAP is to be supported by + Android */ + /* Fill in static LSB header info elsewhere */ + lsfm_fill_static_lsb_hdr_info(g, falcon_id, pnode); + pnode->wpr_header.bin_version = pnode->lsb_header.signature.version; + pnode->next = plsfm->ucode_img_list; + plsfm->ucode_img_list = pnode; + return 0; +} + +/* Free any ucode image structure resources*/ +static void lsfm_free_ucode_img_res(struct flcn_ucode_img_v1 *p_img) +{ + if (p_img->lsf_desc != NULL) { + kfree(p_img->lsf_desc); + p_img->lsf_desc = NULL; + } +} + +/* Free any ucode image structure resources*/ +static void lsfm_free_nonpmu_ucode_img_res(struct flcn_ucode_img_v1 *p_img) +{ + if (p_img->lsf_desc != NULL) { + kfree(p_img->lsf_desc); + p_img->lsf_desc = NULL; + } + if (p_img->desc != NULL) { + kfree(p_img->desc); + p_img->desc = NULL; + } +} + +static void free_acr_resources(struct gk20a *g, struct ls_flcn_mgr_v1 *plsfm) +{ + u32 cnt = plsfm->managed_flcn_cnt; + struct lsfm_managed_ucode_img_v2 *mg_ucode_img; + + while (cnt) { + mg_ucode_img = plsfm->ucode_img_list; + if (mg_ucode_img->ucode_img.lsf_desc->falcon_id == + LSF_FALCON_ID_PMU) + lsfm_free_ucode_img_res(&mg_ucode_img->ucode_img); + else + lsfm_free_nonpmu_ucode_img_res( + &mg_ucode_img->ucode_img); + plsfm->ucode_img_list = mg_ucode_img->next; + kfree(mg_ucode_img); + cnt--; + } +} + +/* Generate WPR requirements for ACR allocation request */ +static int lsf_gen_wpr_requirements(struct gk20a *g, + struct ls_flcn_mgr_v1 *plsfm) +{ + struct lsfm_managed_ucode_img_v2 *pnode = plsfm->ucode_img_list; + u32 wpr_offset; + + /* Calculate WPR size required */ + + /* Start with an array of WPR headers at the base of the WPR. + The expectation here is that the secure falcon will do a single DMA + read of this array and cache it internally so it's OK to pack these. + Also, we add 1 to the falcon count to indicate the end of the array.*/ + wpr_offset = sizeof(struct lsf_wpr_header_v1) * + (plsfm->managed_flcn_cnt+1); + + /* Walk the managed falcons, accounting for the LSB structs + as well as the ucode images. */ + while (pnode) { + /* Align, save off, and include an LSB header size */ + wpr_offset = ALIGN(wpr_offset, + LSF_LSB_HEADER_ALIGNMENT); + pnode->wpr_header.lsb_offset = wpr_offset; + wpr_offset += sizeof(struct lsf_lsb_header_v1); + + /* Align, save off, and include the original (static) + ucode image size */ + wpr_offset = ALIGN(wpr_offset, + LSF_UCODE_DATA_ALIGNMENT); + pnode->lsb_header.ucode_off = wpr_offset; + wpr_offset += pnode->ucode_img.data_size; + + /* For falcons that use a boot loader (BL), we append a loader + desc structure on the end of the ucode image and consider this + the boot loader data. 
The host will then copy the loader desc
+	args to this space within the WPR region (before locking down)
+	and the HS bin will then copy them to DMEM 0 for the loader. */
+		if (!pnode->ucode_img.header) {
+			/* Track the size for LSB details filled in later.
+			 Note that at this point we don't know what kind of
+			 boot loader desc it is, so we just take the size of
+			 the generic one, which is the largest it will ever
+			 be.
+			*/
+			/* Align (size bloat) and save off generic
+			descriptor size*/
+			pnode->lsb_header.bl_data_size = ALIGN(
+				sizeof(pnode->bl_gen_desc),
+				LSF_BL_DATA_SIZE_ALIGNMENT);
+
+			/*Align, save off, and include the additional BL data*/
+			wpr_offset = ALIGN(wpr_offset,
+				LSF_BL_DATA_ALIGNMENT);
+			pnode->lsb_header.bl_data_off = wpr_offset;
+			wpr_offset += pnode->lsb_header.bl_data_size;
+		} else {
+			/* bl_data_off is already assigned in the static
+			information, but that is relative to the start of
+			the image */
+			pnode->lsb_header.bl_data_off +=
+				(wpr_offset - pnode->ucode_img.data_size);
+		}
+
+		/* Finally, update ucode surface size to include updates */
+		pnode->full_ucode_size = wpr_offset -
+			pnode->lsb_header.ucode_off;
+		if (pnode->wpr_header.falcon_id != LSF_FALCON_ID_PMU) {
+			pnode->lsb_header.app_code_off =
+				pnode->lsb_header.bl_code_size;
+			pnode->lsb_header.app_code_size =
+				pnode->lsb_header.ucode_size -
+				pnode->lsb_header.bl_code_size;
+			pnode->lsb_header.app_data_off =
+				pnode->lsb_header.ucode_size;
+			pnode->lsb_header.app_data_size =
+				pnode->lsb_header.data_size;
+		}
+		pnode = pnode->next;
+	}
+	plsfm->wpr_size = wpr_offset;
+	return 0;
+}
+
+/* Loads ACR bin to FB mem and bootstraps PMU with bootloader code.
+ * start and end are addresses of the ucode blob in the non-WPR region */
+int gp106_bootstrap_hs_flcn(struct gk20a *g)
+{
+	struct mm_gk20a *mm = &g->mm;
+	struct vm_gk20a *vm = &mm->pmu.vm;
+	int err = 0;
+	u64 *acr_dmem;
+	u32 img_size_in_bytes = 0;
+	u32 status;
+	struct acr_desc *acr = &g->acr;
+	const struct firmware *acr_fw = acr->acr_fw;
+	struct flcn_bl_dmem_desc_v1 *bl_dmem_desc = &acr->bl_dmem_desc_v1;
+	u32 *acr_ucode_header_t210_load;
+	u32 *acr_ucode_data_t210_load;
+	struct wpr_carveout_info wpr_inf;
+
+	gp106_dbg_pmu("");
+
+	if (!acr_fw) {
+		/*First time init case*/
+		acr_fw = gk20a_request_firmware(g, GM20B_HSBIN_PMU_UCODE_IMAGE);
+		if (!acr_fw) {
+			gk20a_err(dev_from_gk20a(g), "pmu ucode get fail");
+			return -ENOENT;
+		}
+		acr->acr_fw = acr_fw;
+		acr->hsbin_hdr = (struct bin_hdr *)acr_fw->data;
+		acr->fw_hdr = (struct acr_fw_header *)(acr_fw->data +
+				acr->hsbin_hdr->header_offset);
+		acr_ucode_data_t210_load = (u32 *)(acr_fw->data +
+				acr->hsbin_hdr->data_offset);
+		acr_ucode_header_t210_load = (u32 *)(acr_fw->data +
+				acr->fw_hdr->hdr_offset);
+		img_size_in_bytes = ALIGN((acr->hsbin_hdr->data_size), 256);
+
+		/* Let's patch the signatures first.
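+		 acr_ucode_patch_sig() selects the production or debug
+		 signature (per the falcon's debug-mode setting) and patches
+		 the HS image at the offsets listed at patch_loc.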
*/ + if (acr_ucode_patch_sig(g, acr_ucode_data_t210_load, + (u32 *)(acr_fw->data + + acr->fw_hdr->sig_prod_offset), + (u32 *)(acr_fw->data + + acr->fw_hdr->sig_dbg_offset), + (u32 *)(acr_fw->data + + acr->fw_hdr->patch_loc), + (u32 *)(acr_fw->data + + acr->fw_hdr->patch_sig)) < 0) { + gk20a_err(dev_from_gk20a(g), "patch signatures fail"); + err = -1; + goto err_release_acr_fw; + } + err = gk20a_gmmu_alloc_map(vm, img_size_in_bytes, + &acr->acr_ucode); + if (err) { + err = -ENOMEM; + goto err_release_acr_fw; + } + + g->ops.pmu.get_wpr(g, &wpr_inf); + + acr_dmem = (u64 *) + &(((u8 *)acr_ucode_data_t210_load)[ + acr_ucode_header_t210_load[2]]); + acr->acr_dmem_desc_v1 = (struct flcn_acr_desc_v1 *)((u8 *)( + acr->acr_ucode.cpu_va) + acr_ucode_header_t210_load[2]); + ((struct flcn_acr_desc_v1 *)acr_dmem)->nonwpr_ucode_blob_start = + wpr_inf.nonwpr_base; + ((struct flcn_acr_desc_v1 *)acr_dmem)->nonwpr_ucode_blob_size = + wpr_inf.size; + ((struct flcn_acr_desc_v1 *)acr_dmem)->regions.no_regions = 1; + ((struct flcn_acr_desc_v1 *)acr_dmem)->wpr_offset = 0; + + ((struct flcn_acr_desc_v1 *)acr_dmem)->wpr_region_id = 1; + ((struct flcn_acr_desc_v1 *)acr_dmem)->regions.region_props[ + 0].region_id = 1; + ((struct flcn_acr_desc_v1 *)acr_dmem)->regions.region_props[ + 0].start_addr = (wpr_inf.wpr_base ) >> 8; + ((struct flcn_acr_desc_v1 *)acr_dmem)->regions.region_props[ + 0].end_addr = ((wpr_inf.wpr_base) + wpr_inf.size) >> 8; + ((struct flcn_acr_desc_v1 *)acr_dmem)->regions.region_props[ + 0].shadowmMem_startaddress = wpr_inf.nonwpr_base >> 8; + + gk20a_mem_wr_n(g, &acr->acr_ucode, 0, + acr_ucode_data_t210_load, img_size_in_bytes); + + /* + * In order to execute this binary, we will be using + * a bootloader which will load this image into PMU IMEM/DMEM. + * Fill up the bootloader descriptor for PMU HAL to use.. + * TODO: Use standard descriptor which the generic bootloader is + * checked in. + */ + + bl_dmem_desc->signature[0] = 0; + bl_dmem_desc->signature[1] = 0; + bl_dmem_desc->signature[2] = 0; + bl_dmem_desc->signature[3] = 0; + bl_dmem_desc->ctx_dma = GK20A_PMU_DMAIDX_VIRT; + flcn64_set_dma( &bl_dmem_desc->code_dma_base, + acr->acr_ucode.gpu_va); + bl_dmem_desc->non_sec_code_off = acr_ucode_header_t210_load[0]; + bl_dmem_desc->non_sec_code_size = acr_ucode_header_t210_load[1]; + bl_dmem_desc->sec_code_off = acr_ucode_header_t210_load[5]; + bl_dmem_desc->sec_code_size = acr_ucode_header_t210_load[6]; + bl_dmem_desc->code_entry_point = 0; /* Start at 0th offset */ + flcn64_set_dma( &bl_dmem_desc->data_dma_base, + acr->acr_ucode.gpu_va + + (acr_ucode_header_t210_load[2])); + bl_dmem_desc->data_size = acr_ucode_header_t210_load[3]; + } else + acr->acr_dmem_desc->nonwpr_ucode_blob_size = 0; + + status = pmu_exec_gen_bl(g, bl_dmem_desc, 1); + if (status != 0) { + err = status; + goto err_free_ucode_map; + } + return 0; +err_free_ucode_map: + gk20a_gmmu_unmap_free(vm, &acr->acr_ucode); +err_release_acr_fw: + release_firmware(acr_fw); + acr->acr_fw = NULL; + return err; +} -- cgit v1.2.2
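
For readers tracing lsf_gen_wpr_requirements() above, the sizing pass
reduces to the offset arithmetic sketched below. This is a minimal
standalone model, not the driver code: the struct, the alignment values
and the header sizes are illustrative stand-ins for the LSF_*_ALIGNMENT
constants and lsf_*_header structs the patch uses.

#include <stdint.h>
#include <stdio.h>

#define ALIGN_UP(v, a)	(((v) + (a) - 1) & ~((a) - 1))

/* Stand-in alignments; the real values come from the LSF headers. */
#define LSB_HDR_ALIGN	256
#define UCODE_ALIGN	4096
#define BL_DATA_ALIGN	256

struct img { uint32_t data_size; uint32_t bl_desc_size; };

/* One WPR header per falcon plus a terminator entry at the base,
 * then per falcon: aligned LSB header, aligned ucode image, aligned
 * boot-loader descriptor -- mirroring the loop in the patch. */
static uint32_t gen_wpr_size(const struct img *imgs, unsigned int n,
			     uint32_t wpr_hdr_sz, uint32_t lsb_hdr_sz)
{
	uint32_t off = wpr_hdr_sz * (n + 1);
	unsigned int i;

	for (i = 0; i < n; i++) {
		off = ALIGN_UP(off, LSB_HDR_ALIGN);	/* LSB header */
		off += lsb_hdr_sz;
		off = ALIGN_UP(off, UCODE_ALIGN);	/* ucode image */
		off += imgs[i].data_size;
		off = ALIGN_UP(off, BL_DATA_ALIGN);	/* BL gen desc */
		off += ALIGN_UP(imgs[i].bl_desc_size, BL_DATA_ALIGN);
	}
	return off;
}

int main(void)
{
	/* Illustrative sizes only (a PMU-like and a FECS-like image). */
	struct img imgs[] = { { 0x24000, 0x100 }, { 0x18000, 0x100 } };

	printf("WPR blob size: 0x%x\n", gen_wpr_size(imgs, 2, 32, 512));
	return 0;
}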
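
A second note, on flcn64_set_dma(): falcon DMA descriptors carry a
64-bit FB address as two 32-bit halves. The sketch below (plain C, with
the driver's types replaced by stdint ones) shows the split, and why
the driver can get away with "|=": every descriptor it touches is
zero-initialized by kzalloc()/memset() before the address is written,
so OR-ing into zero behaves like plain assignment.

#include <assert.h>
#include <stdint.h>

struct falc_u64 { uint32_t lo; uint32_t hi; };

static void set_dma(struct falc_u64 *a, uint64_t v)
{
	a->lo |= (uint32_t)(v & 0xffffffffu);	/* low 32 bits */
	a->hi |= (uint32_t)(v >> 32);		/* high 32 bits */
}

int main(void)
{
	struct falc_u64 a = { 0, 0 };	/* must start zeroed, as in the driver */

	set_dma(&a, 0x0000002012345678ull);
	assert(a.lo == 0x12345678u);
	assert(a.hi == 0x20u);
	return 0;
}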