diff options
Diffstat (limited to 'drivers/video/tegra/host/host1x')
-rw-r--r-- | drivers/video/tegra/host/host1x/Makefile | 12 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_cdma.c | 665 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_cdma.h | 41 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_channel.c | 627 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_channel.h | 45 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_debug.c | 404 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_hardware.h | 274 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_hwctx.h | 65 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_intr.c | 218 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_syncpt.c | 248 | ||||
-rw-r--r-- | drivers/video/tegra/host/host1x/host1x_syncpt.h | 77 |
11 files changed, 2676 insertions, 0 deletions
diff --git a/drivers/video/tegra/host/host1x/Makefile b/drivers/video/tegra/host/host1x/Makefile new file mode 100644 index 00000000000..c3214ffe147 --- /dev/null +++ b/drivers/video/tegra/host/host1x/Makefile | |||
@@ -0,0 +1,12 @@ | |||
# Enable gcov coverage profiling for objects built in this directory
GCOV_PROFILE := y

# Pick up nvhost core headers (nvhost_cdma.h, dev.h, ...) one level up
EXTRA_CFLAGS += -Idrivers/video/tegra/host

# host1x hardware backend objects for the nvhost driver
nvhost-host1x-objs = \
	host1x_syncpt.o \
	host1x_channel.o \
	host1x_intr.o \
	host1x_cdma.o \
	host1x_debug.o

obj-$(CONFIG_TEGRA_GRHOST) += nvhost-host1x.o
diff --git a/drivers/video/tegra/host/host1x/host1x_cdma.c b/drivers/video/tegra/host/host1x/host1x_cdma.c new file mode 100644 index 00000000000..cdd6026718b --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_cdma.c | |||
@@ -0,0 +1,665 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_cdma.c | ||
3 | * | ||
4 | * Tegra Graphics Host Command DMA | ||
5 | * | ||
6 | * Copyright (c) 2010-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
21 | #include <linux/slab.h> | ||
22 | #include "nvhost_cdma.h" | ||
23 | #include "dev.h" | ||
24 | |||
25 | #include "host1x_hardware.h" | ||
26 | #include "host1x_syncpt.h" | ||
27 | #include "host1x_cdma.h" | ||
28 | #include "host1x_hwctx.h" | ||
29 | |||
30 | static inline u32 host1x_channel_dmactrl(int stop, int get_rst, int init_get) | ||
31 | { | ||
32 | return HOST1X_CREATE(CHANNEL_DMACTRL, DMASTOP, stop) | ||
33 | | HOST1X_CREATE(CHANNEL_DMACTRL, DMAGETRST, get_rst) | ||
34 | | HOST1X_CREATE(CHANNEL_DMACTRL, DMAINITGET, init_get); | ||
35 | } | ||
36 | |||
37 | static void cdma_timeout_handler(struct work_struct *work); | ||
38 | |||
39 | /* | ||
40 | * push_buffer | ||
41 | * | ||
42 | * The push buffer is a circular array of words to be fetched by command DMA. | ||
43 | * Note that it works slightly differently to the sync queue; fence == cur | ||
44 | * means that the push buffer is full, not empty. | ||
45 | */ | ||
46 | |||
47 | |||
48 | /** | ||
49 | * Reset to empty push buffer | ||
50 | */ | ||
51 | static void push_buffer_reset(struct push_buffer *pb) | ||
52 | { | ||
53 | pb->fence = PUSH_BUFFER_SIZE - 8; | ||
54 | pb->cur = 0; | ||
55 | } | ||
56 | |||
57 | /** | ||
58 | * Init push buffer resources | ||
59 | */ | ||
/**
 * Init push buffer resources
 *
 * Allocates, maps and pins the circular pushbuffer plus a parallel array
 * of (nvmap client, handle) references, one per two-word slot.  On any
 * failure, everything acquired so far is released through the destroy op
 * and -ENOMEM is returned.
 */
static int push_buffer_init(struct push_buffer *pb)
{
	struct nvhost_cdma *cdma = pb_to_cdma(pb);
	struct nvmap_client *nvmap = cdma_to_nvmap(cdma);

	/* clear all fields first so the destroy op on the failure path
	 * only releases what was actually acquired */
	pb->mem = NULL;
	pb->mapped = NULL;
	pb->phys = 0;
	pb->nvmap = NULL;

	BUG_ON(!cdma_pb_op(cdma).reset);
	cdma_pb_op(cdma).reset(pb);

	/* allocate and map pushbuffer memory; the extra 4 bytes hold the
	 * trailing RESTART opcode written below */
	pb->mem = nvmap_alloc(nvmap, PUSH_BUFFER_SIZE + 4, 32,
			      NVMAP_HANDLE_WRITE_COMBINE, 0);
	if (IS_ERR_OR_NULL(pb->mem)) {
		pb->mem = NULL;
		goto fail;
	}
	pb->mapped = nvmap_mmap(pb->mem);
	if (pb->mapped == NULL)
		goto fail;

	/* pin pushbuffer and get physical address
	 * (addresses >= 0xfffff000 are treated as pin failure here —
	 *  assumption based on this check; confirm against nvmap_pin's
	 *  error-return convention) */
	pb->phys = nvmap_pin(nvmap, pb->mem);
	if (pb->phys >= 0xfffff000) {
		pb->phys = 0;
		goto fail;
	}

	/* memory for storing nvmap client and handles for each opcode pair */
	pb->nvmap = kzalloc(NVHOST_GATHER_QUEUE_SIZE *
				sizeof(struct nvmap_client_handle),
			GFP_KERNEL);
	if (!pb->nvmap)
		goto fail;

	/* put the restart at the end of pushbuffer memory so command DMA
	 * wraps back to the start of the buffer */
	*(pb->mapped + (PUSH_BUFFER_SIZE >> 2)) =
		nvhost_opcode_restart(pb->phys);

	return 0;

fail:
	cdma_pb_op(cdma).destroy(pb);
	return -ENOMEM;
}
107 | |||
108 | /** | ||
109 | * Clean up push buffer resources | ||
110 | */ | ||
111 | static void push_buffer_destroy(struct push_buffer *pb) | ||
112 | { | ||
113 | struct nvhost_cdma *cdma = pb_to_cdma(pb); | ||
114 | struct nvmap_client *nvmap = cdma_to_nvmap(cdma); | ||
115 | if (pb->mapped) | ||
116 | nvmap_munmap(pb->mem, pb->mapped); | ||
117 | |||
118 | if (pb->phys != 0) | ||
119 | nvmap_unpin(nvmap, pb->mem); | ||
120 | |||
121 | if (pb->mem) | ||
122 | nvmap_free(nvmap, pb->mem); | ||
123 | |||
124 | kfree(pb->nvmap); | ||
125 | |||
126 | pb->mem = NULL; | ||
127 | pb->mapped = NULL; | ||
128 | pb->phys = 0; | ||
129 | pb->nvmap = 0; | ||
130 | } | ||
131 | |||
132 | /** | ||
133 | * Push two words to the push buffer | ||
134 | * Caller must ensure push buffer is not full | ||
135 | */ | ||
/**
 * Push two words to the push buffer
 * Caller must ensure push buffer is not full
 *
 * Also records the (client, handle) pair for this slot so the references
 * can be cleared when the slot is later popped.
 */
static void push_buffer_push_to(struct push_buffer *pb,
		struct nvmap_client *client,
		struct nvmap_handle *handle, u32 op1, u32 op2)
{
	u32 cur = pb->cur;
	u32 *p = (u32 *)((u32)pb->mapped + cur);	/* current write position */
	/* one reference slot per 8-byte opcode pair */
	u32 cur_nvmap = (cur/8) & (NVHOST_GATHER_QUEUE_SIZE - 1);

	BUG_ON(cur == pb->fence);	/* fence == cur means buffer is full */
	*(p++) = op1;
	*(p++) = op2;
	pb->nvmap[cur_nvmap].client = client;
	pb->nvmap[cur_nvmap].handle = handle;
	/* advance the write pointer, wrapping at the buffer size */
	pb->cur = (cur + 8) & (PUSH_BUFFER_SIZE - 1);
}
150 | |||
151 | /** | ||
152 | * Pop a number of two word slots from the push buffer | ||
153 | * Caller must ensure push buffer is not empty | ||
154 | */ | ||
155 | static void push_buffer_pop_from(struct push_buffer *pb, | ||
156 | unsigned int slots) | ||
157 | { | ||
158 | /* Clear the nvmap references for old items from pb */ | ||
159 | unsigned int i; | ||
160 | u32 fence_nvmap = pb->fence/8; | ||
161 | for (i = 0; i < slots; i++) { | ||
162 | int cur_fence_nvmap = (fence_nvmap+i) | ||
163 | & (NVHOST_GATHER_QUEUE_SIZE - 1); | ||
164 | struct nvmap_client_handle *h = | ||
165 | &pb->nvmap[cur_fence_nvmap]; | ||
166 | h->client = NULL; | ||
167 | h->handle = NULL; | ||
168 | } | ||
169 | /* Advance the next write position */ | ||
170 | pb->fence = (pb->fence + slots * 8) & (PUSH_BUFFER_SIZE - 1); | ||
171 | } | ||
172 | |||
173 | /** | ||
174 | * Return the number of two word slots free in the push buffer | ||
175 | */ | ||
176 | static u32 push_buffer_space(struct push_buffer *pb) | ||
177 | { | ||
178 | return ((pb->fence - pb->cur) & (PUSH_BUFFER_SIZE - 1)) / 8; | ||
179 | } | ||
180 | |||
181 | static u32 push_buffer_putptr(struct push_buffer *pb) | ||
182 | { | ||
183 | return pb->phys + pb->cur; | ||
184 | } | ||
185 | |||
186 | /* | ||
187 | * The syncpt incr buffer is filled with methods to increment syncpts, which | ||
188 | * is later GATHER-ed into the mainline PB. It's used when a timed out context | ||
189 | * is interleaved with other work, so needs to inline the syncpt increments | ||
190 | * to maintain the count (but otherwise does no work). | ||
191 | */ | ||
192 | |||
193 | /** | ||
194 | * Init timeout and syncpt incr buffer resources | ||
195 | */ | ||
/**
 * Init timeout and syncpt incr buffer resources
 *
 * Allocates, maps and pins a buffer pre-filled with SETCLASS/INCR_SYNCPT
 * method sequences; when a context times out, its pushbuffer slots are
 * replaced with GATHERs into this buffer so the syncpt count still
 * advances without executing the original work.  Also arms the delayed
 * timeout work item.
 *
 * Returns 0 on success, -EINVAL for an invalid syncpt id, or -ENOMEM on
 * allocation failure (partially acquired resources are released via the
 * timeout_destroy op).
 */
static int cdma_timeout_init(struct nvhost_cdma *cdma,
				 u32 syncpt_id)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	struct nvmap_client *nvmap = cdma_to_nvmap(cdma);
	struct syncpt_buffer *sb = &cdma->syncpt_buffer;
	struct nvhost_channel *ch = cdma_to_channel(cdma);
	u32 i = 0;

	if (syncpt_id == NVSYNCPT_INVALID)
		return -EINVAL;

	/* allocate and map syncpt incr memory */
	sb->mem = nvmap_alloc(nvmap,
			(SYNCPT_INCR_BUFFER_SIZE_WORDS * sizeof(u32)), 32,
			NVMAP_HANDLE_WRITE_COMBINE, 0);
	if (IS_ERR_OR_NULL(sb->mem)) {
		sb->mem = NULL;
		goto fail;
	}
	sb->mapped = nvmap_mmap(sb->mem);
	if (sb->mapped == NULL)
		goto fail;

	/* pin syncpt buffer and get physical address
	 * (>= 0xfffff000 treated as pin failure — same convention as
	 *  push_buffer_init; confirm against nvmap_pin) */
	sb->phys = nvmap_pin(nvmap, sb->mem);
	if (sb->phys >= 0xfffff000) {
		sb->phys = 0;
		goto fail;
	}

	dev_dbg(&dev->dev->dev, "%s: SYNCPT_INCR buffer at 0x%x\n",
		 __func__, sb->phys);

	/* 3D increments carry two extra words for the WAITBASE update */
	sb->words_per_incr = (syncpt_id == NVSYNCPT_3D) ? 5 : 3;
	sb->incr_per_buffer = (SYNCPT_INCR_BUFFER_SIZE_WORDS /
				sb->words_per_incr);

	/* init buffer with SETCL and INCR_SYNCPT methods
	 * NOTE(review): 'i' indexes words but is compared against
	 * incr_per_buffer (a count of increments) — verify the whole
	 * buffer is meant to be populated by this loop */
	while (i < sb->incr_per_buffer) {
		sb->mapped[i++] = nvhost_opcode_setclass(NV_HOST1X_CLASS_ID,
						0, 0);
		sb->mapped[i++] = nvhost_opcode_imm_incr_syncpt(
						NV_SYNCPT_IMMEDIATE,
						syncpt_id);
		if (syncpt_id == NVSYNCPT_3D) {
			/* also contains base increments */
			sb->mapped[i++] = nvhost_opcode_nonincr(
						NV_CLASS_HOST_INCR_SYNCPT_BASE,
						1);
			sb->mapped[i++] = nvhost_class_host_incr_syncpt_base(
						NVWAITBASE_3D, 1);
		}
		/* restore the channel's own class for following methods */
		sb->mapped[i++] = nvhost_opcode_setclass(ch->dev->class,
						0, 0);
	}
	/* make buffer contents visible before hardware can fetch them */
	wmb();

	INIT_DELAYED_WORK(&cdma->timeout.wq, cdma_timeout_handler);
	cdma->timeout.initialized = true;

	return 0;
fail:
	cdma_op(cdma).timeout_destroy(cdma);
	return -ENOMEM;
}
262 | |||
263 | /** | ||
264 | * Clean up timeout syncpt buffer resources | ||
265 | */ | ||
/**
 * Clean up timeout syncpt buffer resources
 *
 * Reverse of cdma_timeout_init(): unmaps, unpins and frees the syncpt
 * incr buffer, then cancels any pending timeout work.  Safe to call on a
 * partially initialized buffer (used as the init failure path).
 */
static void cdma_timeout_destroy(struct nvhost_cdma *cdma)
{
	struct nvmap_client *nvmap = cdma_to_nvmap(cdma);
	struct syncpt_buffer *sb = &cdma->syncpt_buffer;

	if (sb->mapped)
		nvmap_munmap(sb->mem, sb->mapped);

	if (sb->phys != 0)
		nvmap_unpin(nvmap, sb->mem);

	if (sb->mem)
		nvmap_free(nvmap, sb->mem);

	sb->mem = NULL;
	sb->mapped = NULL;
	sb->phys = 0;

	/* NOTE(review): cancel_delayed_work() does not wait for an
	 * already-running handler — confirm callers serialize against
	 * cdma_timeout_handler() (e.g. via cdma->lock) */
	if (cdma->timeout.initialized)
		cancel_delayed_work(&cdma->timeout.wq);
	cdma->timeout.initialized = false;
}
288 | |||
289 | /** | ||
290 | * Increment timedout buffer's syncpt via CPU. | ||
291 | */ | ||
/**
 * Increment timedout buffer's syncpt via CPU.
 *
 * Performs 'syncpt_incrs' CPU-side syncpt increments, refreshes the
 * shadow value, mirrors the result into WAITBASE_3D when the timed-out
 * syncpt is the 3D one, and NOPs out 'nr_slots' pushbuffer slots
 * starting at DMA address 'getptr' so the dead job's opcodes are never
 * executed by the hardware.
 */
static void cdma_timeout_cpu_incr(struct nvhost_cdma *cdma, u32 getptr,
				u32 syncpt_incrs, u32 syncval, u32 nr_slots)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	struct push_buffer *pb = &cdma->push_buffer;
	u32 i, getidx;

	for (i = 0; i < syncpt_incrs; i++)
		nvhost_syncpt_cpu_incr(&dev->syncpt, cdma->timeout.syncpt_id);

	/* after CPU incr, ensure shadow is up to date */
	nvhost_syncpt_update_min(&dev->syncpt, cdma->timeout.syncpt_id);

	/* update WAITBASE_3D by same number of incrs */
	if (cdma->timeout.syncpt_id == NVSYNCPT_3D) {
		void __iomem *p;
		p = dev->sync_aperture + HOST1X_SYNC_SYNCPT_BASE_0 +
				(NVWAITBASE_3D * sizeof(u32));
		writel(syncval, p);
	}

	/* NOP all the PB slots */
	getidx = getptr - pb->phys;	/* DMA address -> buffer offset */
	while (nr_slots--) {
		u32 *p = (u32 *)((u32)pb->mapped + getidx);
		*(p++) = NVHOST_OPCODE_NOOP;
		*(p++) = NVHOST_OPCODE_NOOP;
		dev_dbg(&dev->dev->dev, "%s: NOP at 0x%x\n",
			__func__, pb->phys + getidx);
		getidx = (getidx + 8) & (PUSH_BUFFER_SIZE - 1);
	}
	/* make the NOPs visible before command DMA is restarted */
	wmb();
}
325 | |||
326 | /** | ||
327 | * This routine is called at the point we transition back into a timed | ||
328 | * ctx. The syncpts are incremented via pushbuffer with a flag indicating | ||
329 | * whether there's a CTXSAVE that should be still executed (for the | ||
330 | * preceding HW ctx). | ||
331 | */ | ||
/**
 * This routine is called at the point we transition back into a timed
 * ctx. The syncpts are incremented via pushbuffer with a flag indicating
 * whether there's a CTXSAVE that should be still executed (for the
 * preceding HW ctx).
 *
 * Replaces the timed-out context's pushbuffer slots (starting at DMA
 * address 'getptr') with GATHERs into the pre-built syncpt incr buffer,
 * optionally skipping over the preceding context's CTXSAVE slots, and
 * NOPs whatever slots remain.
 */
static void cdma_timeout_pb_incr(struct nvhost_cdma *cdma, u32 getptr,
				u32 syncpt_incrs, u32 nr_slots,
				bool exec_ctxsave)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	struct syncpt_buffer *sb = &cdma->syncpt_buffer;
	struct push_buffer *pb = &cdma->push_buffer;
	struct host1x_hwctx *hwctx = to_host1x_hwctx(cdma->timeout.ctx);
	u32 getidx, *p;

	/* should have enough slots to incr to desired count */
	BUG_ON(syncpt_incrs > (nr_slots * sb->incr_per_buffer));

	getidx = getptr - pb->phys;	/* DMA address -> buffer offset */
	if (exec_ctxsave) {
		/* don't disrupt the CTXSAVE of a good/non-timed out ctx:
		 * leave its slots intact and account for its increments */
		nr_slots -= hwctx->save_slots;
		syncpt_incrs -= hwctx->save_incrs;

		getidx += (hwctx->save_slots * 8);
		getidx &= (PUSH_BUFFER_SIZE - 1);

		dev_dbg(&dev->dev->dev,
			"%s: exec CTXSAVE of prev ctx (slots %d, incrs %d)\n",
			__func__, nr_slots, syncpt_incrs);
	}

	/* one GATHER opcode pair per slot, each fetching up to
	 * incr_per_buffer increments from the syncpt incr buffer */
	while (syncpt_incrs) {
		u32 incrs, count;

		/* GATHER count are incrs * number of DWORDs per incr */
		incrs = min(syncpt_incrs, sb->incr_per_buffer);
		count = incrs * sb->words_per_incr;

		p = (u32 *)((u32)pb->mapped + getidx);
		*(p++) = nvhost_opcode_gather(count);
		*(p++) = sb->phys;

		dev_dbg(&dev->dev->dev,
			"%s: GATHER at 0x%x, from 0x%x, dcount = %d\n",
			__func__,
			pb->phys + getidx, sb->phys,
			(incrs * sb->words_per_incr));

		syncpt_incrs -= incrs;
		getidx = (getidx + 8) & (PUSH_BUFFER_SIZE - 1);
		nr_slots--;
	}

	/* NOP remaining slots */
	while (nr_slots--) {
		p = (u32 *)((u32)pb->mapped + getidx);
		*(p++) = NVHOST_OPCODE_NOOP;
		*(p++) = NVHOST_OPCODE_NOOP;
		dev_dbg(&dev->dev->dev, "%s: NOP at 0x%x\n",
			__func__, pb->phys + getidx);
		getidx = (getidx + 8) & (PUSH_BUFFER_SIZE - 1);
	}
	/* make the rewritten slots visible before DMA is restarted */
	wmb();
}
392 | |||
393 | /** | ||
394 | * Start channel DMA | ||
395 | */ | ||
/**
 * Start channel DMA
 *
 * Programs the channel's DMA registers from an idle state: with DMA
 * stopped, set START/PUT/END, pulse GET-reset so GET is initialized to
 * PUT, then clear all control bits to let command DMA run.  No-op if
 * already running.
 */
static void cdma_start(struct nvhost_cdma *cdma)
{
	void __iomem *chan_regs = cdma_to_channel(cdma)->aperture;

	if (cdma->running)
		return;

	BUG_ON(!cdma_pb_op(cdma).putptr);
	cdma->last_put = cdma_pb_op(cdma).putptr(&cdma->push_buffer);

	/* stop DMA while the pointers are reprogrammed */
	writel(host1x_channel_dmactrl(true, false, false),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	/* set base, put, end pointer (all of memory) */
	writel(0, chan_regs + HOST1X_CHANNEL_DMASTART);
	writel(cdma->last_put, chan_regs + HOST1X_CHANNEL_DMAPUT);
	writel(0xFFFFFFFF, chan_regs + HOST1X_CHANNEL_DMAEND);

	/* reset GET */
	writel(host1x_channel_dmactrl(true, true, true),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	/* start the command DMA */
	writel(host1x_channel_dmactrl(false, false, false),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	cdma->running = true;
}
424 | |||
425 | /** | ||
426 | * Similar to cdma_start(), but rather than starting from an idle | ||
427 | * state (where DMA GET is set to DMA PUT), on a timeout we restore | ||
428 | * DMA GET from an explicit value (so DMA may again be pending). | ||
429 | */ | ||
/**
 * Similar to cdma_start(), but rather than starting from an idle
 * state (where DMA GET is set to DMA PUT), on a timeout we restore
 * DMA GET from an explicit value (so DMA may again be pending).
 *
 * The GET value is loaded by writing it to PUT and pulsing GET-reset
 * (which copies PUT into GET); the real PUT is written afterwards.
 */
static void cdma_timeout_restart(struct nvhost_cdma *cdma, u32 getptr)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	void __iomem *chan_regs = cdma_to_channel(cdma)->aperture;

	if (cdma->running)
		return;

	BUG_ON(!cdma_pb_op(cdma).putptr);
	cdma->last_put = cdma_pb_op(cdma).putptr(&cdma->push_buffer);

	/* stop DMA while registers are reprogrammed */
	writel(host1x_channel_dmactrl(true, false, false),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	/* set base, end pointer (all of memory) */
	writel(0, chan_regs + HOST1X_CHANNEL_DMASTART);
	writel(0xFFFFFFFF, chan_regs + HOST1X_CHANNEL_DMAEND);

	/* set GET, by loading the value in PUT (then reset GET) */
	writel(getptr, chan_regs + HOST1X_CHANNEL_DMAPUT);
	writel(host1x_channel_dmactrl(true, true, true),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	dev_dbg(&dev->dev->dev,
		"%s: DMA GET 0x%x, PUT HW 0x%x / shadow 0x%x\n",
		__func__,
		readl(chan_regs + HOST1X_CHANNEL_DMAGET),
		readl(chan_regs + HOST1X_CHANNEL_DMAPUT),
		cdma->last_put);

	/* deassert GET reset and set PUT */
	writel(host1x_channel_dmactrl(true, false, false),
		chan_regs + HOST1X_CHANNEL_DMACTRL);
	writel(cdma->last_put, chan_regs + HOST1X_CHANNEL_DMAPUT);

	/* start the command DMA */
	writel(host1x_channel_dmactrl(false, false, false),
		chan_regs + HOST1X_CHANNEL_DMACTRL);

	cdma->running = true;
}
471 | |||
472 | /** | ||
473 | * Kick channel DMA into action by writing its PUT offset (if it has changed) | ||
474 | */ | ||
475 | static void cdma_kick(struct nvhost_cdma *cdma) | ||
476 | { | ||
477 | u32 put; | ||
478 | BUG_ON(!cdma_pb_op(cdma).putptr); | ||
479 | |||
480 | put = cdma_pb_op(cdma).putptr(&cdma->push_buffer); | ||
481 | |||
482 | if (put != cdma->last_put) { | ||
483 | void __iomem *chan_regs = cdma_to_channel(cdma)->aperture; | ||
484 | wmb(); | ||
485 | writel(put, chan_regs + HOST1X_CHANNEL_DMAPUT); | ||
486 | cdma->last_put = put; | ||
487 | } | ||
488 | } | ||
489 | |||
/**
 * Stop channel DMA.
 *
 * Waits (under cdma->lock) for the sync queue to drain, then asserts the
 * DMASTOP bit and marks the channel stopped.
 */
static void cdma_stop(struct nvhost_cdma *cdma)
{
	void __iomem *chan_regs = cdma_to_channel(cdma)->aperture;

	mutex_lock(&cdma->lock);
	if (cdma->running) {
		/* let all queued work complete before halting DMA */
		nvhost_cdma_wait_locked(cdma, CDMA_EVENT_SYNC_QUEUE_EMPTY);
		writel(host1x_channel_dmactrl(true, false, false),
			chan_regs + HOST1X_CHANNEL_DMACTRL);
		cdma->running = false;
	}
	mutex_unlock(&cdma->lock);
}
503 | |||
504 | /** | ||
505 | * Retrieve the op pair at a slot offset from a DMA address | ||
506 | */ | ||
507 | void cdma_peek(struct nvhost_cdma *cdma, | ||
508 | u32 dmaget, int slot, u32 *out) | ||
509 | { | ||
510 | u32 offset = dmaget - cdma->push_buffer.phys; | ||
511 | u32 *p = cdma->push_buffer.mapped; | ||
512 | |||
513 | offset = ((offset + slot * 8) & (PUSH_BUFFER_SIZE - 1)) >> 2; | ||
514 | out[0] = p[offset]; | ||
515 | out[1] = p[offset + 1]; | ||
516 | } | ||
517 | |||
518 | /** | ||
519 | * Stops both channel's command processor and CDMA immediately. | ||
520 | * Also, tears down the channel and resets corresponding module. | ||
521 | */ | ||
/**
 * Stops both channel's command processor and CDMA immediately.
 * Also, tears down the channel and resets corresponding module.
 *
 * Sequence: stop the channel's command processor (CMDPROC_STOP bit),
 * assert DMASTOP, trigger channel teardown, then reset the client
 * module.  Must be paired with cdma_timeout_teardown_end().
 */
void cdma_timeout_teardown_begin(struct nvhost_cdma *cdma)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	struct nvhost_channel *ch = cdma_to_channel(cdma);
	u32 cmdproc_stop;

	BUG_ON(cdma->torndown);	/* teardown must not be nested */

	dev_dbg(&dev->dev->dev,
		"begin channel teardown (channel id %d)\n", ch->chid);

	/* set this channel's bit in the global CMDPROC_STOP mask */
	cmdproc_stop = readl(dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);
	cmdproc_stop |= BIT(ch->chid);
	writel(cmdproc_stop, dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);

	dev_dbg(&dev->dev->dev,
		"%s: DMA GET 0x%x, PUT HW 0x%x / shadow 0x%x\n",
		__func__,
		readl(ch->aperture + HOST1X_CHANNEL_DMAGET),
		readl(ch->aperture + HOST1X_CHANNEL_DMAPUT),
		cdma->last_put);

	writel(host1x_channel_dmactrl(true, false, false),
		ch->aperture + HOST1X_CHANNEL_DMACTRL);

	writel(BIT(ch->chid), dev->sync_aperture + HOST1X_SYNC_CH_TEARDOWN);
	nvhost_module_reset(ch->dev);

	cdma->running = false;
	cdma->torndown = true;
}
553 | |||
/**
 * Finish a channel teardown: re-enable the command processor and restart
 * command DMA with GET restored to 'getptr'.  Must follow a successful
 * cdma_timeout_teardown_begin().
 */
void cdma_timeout_teardown_end(struct nvhost_cdma *cdma, u32 getptr)
{
	struct nvhost_master *dev = cdma_to_dev(cdma);
	struct nvhost_channel *ch = cdma_to_channel(cdma);
	u32 cmdproc_stop;

	BUG_ON(!cdma->torndown || cdma->running);

	dev_dbg(&dev->dev->dev,
		"end channel teardown (id %d, DMAGET restart = 0x%x)\n",
		ch->chid, getptr);

	/* clear this channel's bit in the global CMDPROC_STOP mask */
	cmdproc_stop = readl(dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);
	cmdproc_stop &= ~(BIT(ch->chid));
	writel(cmdproc_stop, dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);

	cdma->torndown = false;
	cdma_timeout_restart(cdma, getptr);
}
573 | |||
574 | /** | ||
575 | * If this timeout fires, it indicates the current sync_queue entry has | ||
576 | * exceeded its TTL and the userctx should be timed out and remaining | ||
577 | * submits already issued cleaned up (future submits return an error). | ||
578 | */ | ||
/**
 * If this timeout fires, it indicates the current sync_queue entry has
 * exceeded its TTL and the userctx should be timed out and remaining
 * submits already issued cleaned up (future submits return an error).
 *
 * Runs from the delayed work queue armed in cdma_timeout_init().  Stops
 * the channel's command processor to take a stable snapshot, bails out
 * (restoring the processor) if the job actually completed or the timeout
 * has no owner, and otherwise tears the channel down and cleans up the
 * sync queue.
 */
static void cdma_timeout_handler(struct work_struct *work)
{
	struct nvhost_cdma *cdma;
	struct nvhost_master *dev;
	struct nvhost_syncpt *sp;
	struct nvhost_channel *ch;

	u32 syncpt_val;

	u32 prev_cmdproc, cmdproc_stop;

	cdma = container_of(to_delayed_work(work), struct nvhost_cdma,
			    timeout.wq);
	dev = cdma_to_dev(cdma);
	sp = &dev->syncpt;
	ch = cdma_to_channel(cdma);

	mutex_lock(&cdma->lock);

	/* clientid == 0 means the timeout no longer has an owner */
	if (!cdma->timeout.clientid) {
		dev_dbg(&dev->dev->dev,
			 "cdma_timeout: expired, but has no clientid\n");
		mutex_unlock(&cdma->lock);
		return;
	}

	/* stop processing to get a clean snapshot */
	prev_cmdproc = readl(dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);
	cmdproc_stop = prev_cmdproc | BIT(ch->chid);
	writel(cmdproc_stop, dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);

	dev_dbg(&dev->dev->dev, "cdma_timeout: cmdproc was 0x%x is 0x%x\n",
		prev_cmdproc, cmdproc_stop);

	syncpt_val = nvhost_syncpt_update_min(&dev->syncpt,
			cdma->timeout.syncpt_id);

	/* has buffer actually completed?  (signed diff handles wrap) */
	if ((s32)(syncpt_val - cdma->timeout.syncpt_val) >= 0) {
		dev_dbg(&dev->dev->dev,
			 "cdma_timeout: expired, but buffer had completed\n");
		/* restore */
		cmdproc_stop = prev_cmdproc & ~(BIT(ch->chid));
		writel(cmdproc_stop,
			dev->sync_aperture + HOST1X_SYNC_CMDPROC_STOP);
		mutex_unlock(&cdma->lock);
		return;
	}

	dev_warn(&dev->dev->dev,
		"%s: timeout: %d (%s) ctx 0x%p, HW thresh %d, done %d\n",
		__func__,
		cdma->timeout.syncpt_id,
		syncpt_op(sp).name(sp, cdma->timeout.syncpt_id),
		cdma->timeout.ctx,
		syncpt_val, cdma->timeout.syncpt_val);

	/* stop HW, resetting channel/module */
	cdma_op(cdma).timeout_teardown_begin(cdma);

	nvhost_cdma_update_sync_queue(cdma, sp, &dev->dev->dev);
	mutex_unlock(&cdma->lock);
}
642 | |||
643 | int host1x_init_cdma_support(struct nvhost_master *host) | ||
644 | { | ||
645 | host->op.cdma.start = cdma_start; | ||
646 | host->op.cdma.stop = cdma_stop; | ||
647 | host->op.cdma.kick = cdma_kick; | ||
648 | |||
649 | host->op.cdma.timeout_init = cdma_timeout_init; | ||
650 | host->op.cdma.timeout_destroy = cdma_timeout_destroy; | ||
651 | host->op.cdma.timeout_teardown_begin = cdma_timeout_teardown_begin; | ||
652 | host->op.cdma.timeout_teardown_end = cdma_timeout_teardown_end; | ||
653 | host->op.cdma.timeout_cpu_incr = cdma_timeout_cpu_incr; | ||
654 | host->op.cdma.timeout_pb_incr = cdma_timeout_pb_incr; | ||
655 | |||
656 | host->op.push_buffer.reset = push_buffer_reset; | ||
657 | host->op.push_buffer.init = push_buffer_init; | ||
658 | host->op.push_buffer.destroy = push_buffer_destroy; | ||
659 | host->op.push_buffer.push_to = push_buffer_push_to; | ||
660 | host->op.push_buffer.pop_from = push_buffer_pop_from; | ||
661 | host->op.push_buffer.space = push_buffer_space; | ||
662 | host->op.push_buffer.putptr = push_buffer_putptr; | ||
663 | |||
664 | return 0; | ||
665 | } | ||
diff --git a/drivers/video/tegra/host/host1x/host1x_cdma.h b/drivers/video/tegra/host/host1x/host1x_cdma.h new file mode 100644 index 00000000000..60909236a7c --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_cdma.h | |||
@@ -0,0 +1,41 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_cdma.h | ||
3 | * | ||
4 | * Tegra Graphics Host Channel | ||
5 | * | ||
6 | * Copyright (c) 2011-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
#ifndef __NVHOST_HOST1X_HOST1X_CDMA_H
#define __NVHOST_HOST1X_HOST1X_CDMA_H

/* Size of the sync queue. If it is too small, we won't be able to queue up
 * many command buffers. If it is too large, we waste memory. */
#define NVHOST_SYNC_QUEUE_SIZE 512

/* Number of gathers we allow to be queued up per channel. Must be a
 * power of two. Currently sized such that pushbuffer is 4KB (512*8B). */
#define NVHOST_GATHER_QUEUE_SIZE 512

/* 8 bytes per slot. (This number does not include the final RESTART.) */
#define PUSH_BUFFER_SIZE (NVHOST_GATHER_QUEUE_SIZE * 8)

/* 4K page containing GATHERed methods to increment channel syncpts
 * and replaces the original timed out contexts GATHER slots */
#define SYNCPT_INCR_BUFFER_SIZE_WORDS   (4096 / sizeof(u32))

/* Install the host1x CDMA/push-buffer op tables (host1x_cdma.c) */
int host1x_init_cdma_support(struct nvhost_master *);

#endif
diff --git a/drivers/video/tegra/host/host1x/host1x_channel.c b/drivers/video/tegra/host/host1x/host1x_channel.c new file mode 100644 index 00000000000..b16a34f416a --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_channel.c | |||
@@ -0,0 +1,627 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/channel_host1x.c | ||
3 | * | ||
4 | * Tegra Graphics Host Channel | ||
5 | * | ||
6 | * Copyright (c) 2010-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
21 | #include "nvhost_channel.h" | ||
22 | #include "dev.h" | ||
23 | #include "nvhost_hwctx.h" | ||
24 | #include <trace/events/nvhost.h> | ||
25 | #include <linux/slab.h> | ||
26 | |||
27 | #include "host1x_syncpt.h" | ||
28 | #include "host1x_channel.h" | ||
29 | #include "host1x_hardware.h" | ||
30 | #include "host1x_hwctx.h" | ||
31 | #include "nvhost_intr.h" | ||
32 | |||
33 | #define NV_FIFO_READ_TIMEOUT 200000 | ||
34 | |||
35 | static void sync_waitbases(struct nvhost_channel *ch, u32 syncpt_val) | ||
36 | { | ||
37 | unsigned long waitbase; | ||
38 | unsigned long int waitbase_mask = ch->dev->waitbases; | ||
39 | if (ch->dev->waitbasesync) { | ||
40 | waitbase = find_first_bit(&waitbase_mask, BITS_PER_LONG); | ||
41 | nvhost_cdma_push(&ch->cdma, | ||
42 | nvhost_opcode_setclass(NV_HOST1X_CLASS_ID, | ||
43 | NV_CLASS_HOST_LOAD_SYNCPT_BASE, | ||
44 | 1), | ||
45 | nvhost_class_host_load_syncpt_base(waitbase, | ||
46 | syncpt_val)); | ||
47 | } | ||
48 | } | ||
49 | |||
50 | static void *pre_submit_ctxsave(struct nvhost_job *job, | ||
51 | struct nvhost_hwctx *cur_ctx) | ||
52 | { | ||
53 | struct nvhost_channel *ch = job->ch; | ||
54 | void *ctxsave_waiter = NULL; | ||
55 | |||
56 | /* Is a save needed? */ | ||
57 | if (!cur_ctx || ch->cur_ctx == job->hwctx) | ||
58 | return NULL; | ||
59 | |||
60 | if (cur_ctx->has_timedout) { | ||
61 | dev_dbg(&ch->dev->dev, | ||
62 | "%s: skip save of timed out context (0x%p)\n", | ||
63 | __func__, ch->cur_ctx); | ||
64 | |||
65 | return NULL; | ||
66 | } | ||
67 | |||
68 | /* Allocate save waiter if needed */ | ||
69 | if (ch->ctxhandler->save_service) { | ||
70 | ctxsave_waiter = nvhost_intr_alloc_waiter(); | ||
71 | if (!ctxsave_waiter) | ||
72 | return ERR_PTR(-ENOMEM); | ||
73 | } | ||
74 | |||
75 | return ctxsave_waiter; | ||
76 | } | ||
77 | |||
/*
 * Push a save of the outgoing context @cur_ctx into the channel ahead
 * of @job's own commands, and (if @ctxsave_waiter was allocated by
 * pre_submit_ctxsave()) schedule the save-service interrupt.
 *
 * Adds the save's syncpoint increments to job->syncpt_incrs, so this
 * must run before the caller reserves the job's own increments.
 */
static void submit_ctxsave(struct nvhost_job *job, void *ctxsave_waiter,
		struct nvhost_hwctx *cur_ctx)
{
	struct nvhost_master *host = nvhost_get_host(job->ch->dev);
	struct nvhost_channel *ch = job->ch;
	u32 syncval;
	int err;
	u32 save_thresh = 0;

	/* Is a save needed? */
	if (!cur_ctx || cur_ctx == job->hwctx || cur_ctx->has_timedout)
		return;

	/* Retrieve save threshold if we have a waiter */
	if (ctxsave_waiter)
		save_thresh =
			nvhost_syncpt_read_max(&host->syncpt, job->syncpt_id)
			+ to_host1x_hwctx(cur_ctx)->save_thresh;

	/* Adjust the syncpoint max (the call advances the stored max;
	 * its return value is intentionally unused here) */
	job->syncpt_incrs += to_host1x_hwctx(cur_ctx)->save_incrs;
	syncval = nvhost_syncpt_incr_max(&host->syncpt,
			job->syncpt_id,
			to_host1x_hwctx(cur_ctx)->save_incrs);

	/* Send the save to channel */
	cur_ctx->valid = true;
	ch->ctxhandler->save_push(cur_ctx, &ch->cdma);
	nvhost_job_get_hwctx(job, cur_ctx);

	/* Notify save service */
	if (ctxsave_waiter) {
		err = nvhost_intr_add_action(&host->intr,
			job->syncpt_id,
			save_thresh,
			NVHOST_INTR_ACTION_CTXSAVE, cur_ctx,
			ctxsave_waiter,
			NULL);
		/* ownership of the waiter passed to the intr layer */
		ctxsave_waiter = NULL;
		WARN(err, "Failed to set ctx save interrupt");
	}

	trace_nvhost_channel_context_save(ch->dev->name, cur_ctx);
}
122 | |||
123 | static void submit_ctxrestore(struct nvhost_job *job) | ||
124 | { | ||
125 | struct nvhost_master *host = nvhost_get_host(job->ch->dev); | ||
126 | struct nvhost_channel *ch = job->ch; | ||
127 | u32 syncval; | ||
128 | struct host1x_hwctx *ctx = | ||
129 | job->hwctx ? to_host1x_hwctx(job->hwctx) : NULL; | ||
130 | |||
131 | /* First check if we have a valid context to restore */ | ||
132 | if(ch->cur_ctx == job->hwctx || !job->hwctx || !job->hwctx->valid) | ||
133 | return; | ||
134 | |||
135 | /* Increment syncpt max */ | ||
136 | job->syncpt_incrs += ctx->restore_incrs; | ||
137 | syncval = nvhost_syncpt_incr_max(&host->syncpt, | ||
138 | job->syncpt_id, | ||
139 | ctx->restore_incrs); | ||
140 | |||
141 | /* Send restore buffer to channel */ | ||
142 | nvhost_cdma_push_gather(&ch->cdma, | ||
143 | host->nvmap, | ||
144 | nvmap_ref_to_handle(ctx->restore), | ||
145 | nvhost_opcode_gather(ctx->restore_size), | ||
146 | ctx->restore_phys); | ||
147 | |||
148 | trace_nvhost_channel_context_restore(ch->dev->name, &ctx->hwctx); | ||
149 | } | ||
150 | |||
151 | void submit_nullkickoff(struct nvhost_job *job, int user_syncpt_incrs) | ||
152 | { | ||
153 | struct nvhost_channel *ch = job->ch; | ||
154 | int incr; | ||
155 | u32 op_incr; | ||
156 | |||
157 | /* push increments that correspond to nulled out commands */ | ||
158 | op_incr = nvhost_opcode_imm_incr_syncpt(NV_SYNCPT_OP_DONE, | ||
159 | job->syncpt_id); | ||
160 | for (incr = 0; incr < (user_syncpt_incrs >> 1); incr++) | ||
161 | nvhost_cdma_push(&ch->cdma, op_incr, op_incr); | ||
162 | if (user_syncpt_incrs & 1) | ||
163 | nvhost_cdma_push(&ch->cdma, op_incr, NVHOST_OPCODE_NOOP); | ||
164 | |||
165 | /* for 3d, waitbase needs to be incremented after each submit */ | ||
166 | if (ch->dev->class == NV_GRAPHICS_3D_CLASS_ID) { | ||
167 | u32 waitbase = to_host1x_hwctx_handler(job->hwctx->h)->waitbase; | ||
168 | nvhost_cdma_push(&ch->cdma, | ||
169 | nvhost_opcode_setclass( | ||
170 | NV_HOST1X_CLASS_ID, | ||
171 | NV_CLASS_HOST_INCR_SYNCPT_BASE, | ||
172 | 1), | ||
173 | nvhost_class_host_incr_syncpt_base( | ||
174 | waitbase, | ||
175 | user_syncpt_incrs)); | ||
176 | } | ||
177 | } | ||
178 | |||
179 | void submit_gathers(struct nvhost_job *job) | ||
180 | { | ||
181 | /* push user gathers */ | ||
182 | int i = 0; | ||
183 | for ( ; i < job->num_gathers; i++) { | ||
184 | u32 op1 = nvhost_opcode_gather(job->gathers[i].words); | ||
185 | u32 op2 = job->gathers[i].mem; | ||
186 | nvhost_cdma_push_gather(&job->ch->cdma, | ||
187 | job->nvmap, job->unpins[i/2], | ||
188 | op1, op2); | ||
189 | } | ||
190 | } | ||
191 | |||
192 | int host1x_channel_submit(struct nvhost_job *job) | ||
193 | { | ||
194 | struct nvhost_channel *ch = job->ch; | ||
195 | struct nvhost_syncpt *sp = &nvhost_get_host(job->ch->dev)->syncpt; | ||
196 | u32 user_syncpt_incrs = job->syncpt_incrs; | ||
197 | u32 prev_max = 0; | ||
198 | u32 syncval; | ||
199 | int err; | ||
200 | void *completed_waiter = NULL, *ctxsave_waiter = NULL; | ||
201 | |||
202 | /* Bail out on timed out contexts */ | ||
203 | if (job->hwctx && job->hwctx->has_timedout) | ||
204 | return -ETIMEDOUT; | ||
205 | |||
206 | /* Turn on the client module and host1x */ | ||
207 | nvhost_module_busy(ch->dev); | ||
208 | if (ch->dev->busy) | ||
209 | ch->dev->busy(ch->dev); | ||
210 | |||
211 | /* before error checks, return current max */ | ||
212 | prev_max = job->syncpt_end = | ||
213 | nvhost_syncpt_read_max(sp, job->syncpt_id); | ||
214 | |||
215 | /* get submit lock */ | ||
216 | err = mutex_lock_interruptible(&ch->submitlock); | ||
217 | if (err) { | ||
218 | nvhost_module_idle(ch->dev); | ||
219 | goto error; | ||
220 | } | ||
221 | |||
222 | /* Do the needed allocations */ | ||
223 | ctxsave_waiter = pre_submit_ctxsave(job, ch->cur_ctx); | ||
224 | if (IS_ERR(ctxsave_waiter)) { | ||
225 | err = PTR_ERR(ctxsave_waiter); | ||
226 | nvhost_module_idle(ch->dev); | ||
227 | mutex_unlock(&ch->submitlock); | ||
228 | goto error; | ||
229 | } | ||
230 | |||
231 | completed_waiter = nvhost_intr_alloc_waiter(); | ||
232 | if (!completed_waiter) { | ||
233 | nvhost_module_idle(ch->dev); | ||
234 | mutex_unlock(&ch->submitlock); | ||
235 | err = -ENOMEM; | ||
236 | goto error; | ||
237 | } | ||
238 | |||
239 | /* remove stale waits */ | ||
240 | if (job->num_waitchk) { | ||
241 | err = nvhost_syncpt_wait_check(sp, | ||
242 | job->nvmap, | ||
243 | job->waitchk_mask, | ||
244 | job->waitchk, | ||
245 | job->num_waitchk); | ||
246 | if (err) { | ||
247 | dev_warn(&ch->dev->dev, | ||
248 | "nvhost_syncpt_wait_check failed: %d\n", err); | ||
249 | mutex_unlock(&ch->submitlock); | ||
250 | nvhost_module_idle(ch->dev); | ||
251 | goto error; | ||
252 | } | ||
253 | } | ||
254 | |||
255 | /* begin a CDMA submit */ | ||
256 | err = nvhost_cdma_begin(&ch->cdma, job); | ||
257 | if (err) { | ||
258 | mutex_unlock(&ch->submitlock); | ||
259 | nvhost_module_idle(ch->dev); | ||
260 | goto error; | ||
261 | } | ||
262 | |||
263 | submit_ctxsave(job, ctxsave_waiter, ch->cur_ctx); | ||
264 | submit_ctxrestore(job); | ||
265 | ch->cur_ctx = job->hwctx; | ||
266 | |||
267 | syncval = nvhost_syncpt_incr_max(sp, | ||
268 | job->syncpt_id, user_syncpt_incrs); | ||
269 | |||
270 | job->syncpt_end = syncval; | ||
271 | |||
272 | /* add a setclass for modules that require it */ | ||
273 | if (ch->dev->class) | ||
274 | nvhost_cdma_push(&ch->cdma, | ||
275 | nvhost_opcode_setclass(ch->dev->class, 0, 0), | ||
276 | NVHOST_OPCODE_NOOP); | ||
277 | |||
278 | if (job->null_kickoff) | ||
279 | submit_nullkickoff(job, user_syncpt_incrs); | ||
280 | else | ||
281 | submit_gathers(job); | ||
282 | |||
283 | sync_waitbases(ch, job->syncpt_end); | ||
284 | |||
285 | /* end CDMA submit & stash pinned hMems into sync queue */ | ||
286 | nvhost_cdma_end(&ch->cdma, job); | ||
287 | |||
288 | trace_nvhost_channel_submitted(ch->dev->name, | ||
289 | prev_max, syncval); | ||
290 | |||
291 | /* schedule a submit complete interrupt */ | ||
292 | err = nvhost_intr_add_action(&nvhost_get_host(ch->dev)->intr, | ||
293 | job->syncpt_id, syncval, | ||
294 | NVHOST_INTR_ACTION_SUBMIT_COMPLETE, ch, | ||
295 | completed_waiter, | ||
296 | NULL); | ||
297 | completed_waiter = NULL; | ||
298 | WARN(err, "Failed to set submit complete interrupt"); | ||
299 | |||
300 | mutex_unlock(&ch->submitlock); | ||
301 | |||
302 | return 0; | ||
303 | |||
304 | error: | ||
305 | kfree(ctxsave_waiter); | ||
306 | kfree(completed_waiter); | ||
307 | return err; | ||
308 | } | ||
309 | |||
310 | int host1x_channel_read_3d_reg( | ||
311 | struct nvhost_channel *channel, | ||
312 | struct nvhost_hwctx *hwctx, | ||
313 | u32 offset, | ||
314 | u32 *value) | ||
315 | { | ||
316 | struct host1x_hwctx *hwctx_to_save = NULL; | ||
317 | struct nvhost_hwctx_handler *h = hwctx->h; | ||
318 | struct host1x_hwctx_handler *p = to_host1x_hwctx_handler(h); | ||
319 | bool need_restore = false; | ||
320 | u32 syncpt_incrs = 4; | ||
321 | unsigned int pending = 0; | ||
322 | DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq); | ||
323 | void *ref; | ||
324 | void *ctx_waiter, *read_waiter, *completed_waiter; | ||
325 | struct nvhost_job *job; | ||
326 | u32 syncval; | ||
327 | int err; | ||
328 | |||
329 | if (hwctx && hwctx->has_timedout) | ||
330 | return -ETIMEDOUT; | ||
331 | |||
332 | ctx_waiter = nvhost_intr_alloc_waiter(); | ||
333 | read_waiter = nvhost_intr_alloc_waiter(); | ||
334 | completed_waiter = nvhost_intr_alloc_waiter(); | ||
335 | if (!ctx_waiter || !read_waiter || !completed_waiter) { | ||
336 | err = -ENOMEM; | ||
337 | goto done; | ||
338 | } | ||
339 | |||
340 | job = nvhost_job_alloc(channel, hwctx, | ||
341 | NULL, | ||
342 | nvhost_get_host(channel->dev)->nvmap, 0, 0); | ||
343 | if (!job) { | ||
344 | err = -ENOMEM; | ||
345 | goto done; | ||
346 | } | ||
347 | |||
348 | /* keep module powered */ | ||
349 | nvhost_module_busy(channel->dev); | ||
350 | |||
351 | /* get submit lock */ | ||
352 | err = mutex_lock_interruptible(&channel->submitlock); | ||
353 | if (err) { | ||
354 | nvhost_module_idle(channel->dev); | ||
355 | return err; | ||
356 | } | ||
357 | |||
358 | /* context switch */ | ||
359 | if (channel->cur_ctx != hwctx) { | ||
360 | hwctx_to_save = channel->cur_ctx ? | ||
361 | to_host1x_hwctx(channel->cur_ctx) : NULL; | ||
362 | if (hwctx_to_save) { | ||
363 | syncpt_incrs += hwctx_to_save->save_incrs; | ||
364 | hwctx_to_save->hwctx.valid = true; | ||
365 | channel->ctxhandler->get(&hwctx_to_save->hwctx); | ||
366 | } | ||
367 | channel->cur_ctx = hwctx; | ||
368 | if (channel->cur_ctx && channel->cur_ctx->valid) { | ||
369 | need_restore = true; | ||
370 | syncpt_incrs += to_host1x_hwctx(channel->cur_ctx) | ||
371 | ->restore_incrs; | ||
372 | } | ||
373 | } | ||
374 | |||
375 | syncval = nvhost_syncpt_incr_max(&nvhost_get_host(channel->dev)->syncpt, | ||
376 | p->syncpt, syncpt_incrs); | ||
377 | |||
378 | job->syncpt_id = p->syncpt; | ||
379 | job->syncpt_incrs = syncpt_incrs; | ||
380 | job->syncpt_end = syncval; | ||
381 | |||
382 | /* begin a CDMA submit */ | ||
383 | nvhost_cdma_begin(&channel->cdma, job); | ||
384 | |||
385 | /* push save buffer (pre-gather setup depends on unit) */ | ||
386 | if (hwctx_to_save) | ||
387 | h->save_push(&hwctx_to_save->hwctx, &channel->cdma); | ||
388 | |||
389 | /* gather restore buffer */ | ||
390 | if (need_restore) | ||
391 | nvhost_cdma_push(&channel->cdma, | ||
392 | nvhost_opcode_gather(to_host1x_hwctx(channel->cur_ctx) | ||
393 | ->restore_size), | ||
394 | to_host1x_hwctx(channel->cur_ctx)->restore_phys); | ||
395 | |||
396 | /* Switch to 3D - wait for it to complete what it was doing */ | ||
397 | nvhost_cdma_push(&channel->cdma, | ||
398 | nvhost_opcode_setclass(NV_GRAPHICS_3D_CLASS_ID, 0, 0), | ||
399 | nvhost_opcode_imm_incr_syncpt(NV_SYNCPT_OP_DONE, | ||
400 | p->syncpt)); | ||
401 | nvhost_cdma_push(&channel->cdma, | ||
402 | nvhost_opcode_setclass(NV_HOST1X_CLASS_ID, | ||
403 | NV_CLASS_HOST_WAIT_SYNCPT_BASE, 1), | ||
404 | nvhost_class_host_wait_syncpt_base(p->syncpt, | ||
405 | p->waitbase, 1)); | ||
406 | /* Tell 3D to send register value to FIFO */ | ||
407 | nvhost_cdma_push(&channel->cdma, | ||
408 | nvhost_opcode_nonincr(NV_CLASS_HOST_INDOFF, 1), | ||
409 | nvhost_class_host_indoff_reg_read(NV_HOST_MODULE_GR3D, | ||
410 | offset, false)); | ||
411 | nvhost_cdma_push(&channel->cdma, | ||
412 | nvhost_opcode_imm(NV_CLASS_HOST_INDDATA, 0), | ||
413 | NVHOST_OPCODE_NOOP); | ||
414 | /* Increment syncpt to indicate that FIFO can be read */ | ||
415 | nvhost_cdma_push(&channel->cdma, | ||
416 | nvhost_opcode_imm_incr_syncpt(NV_SYNCPT_IMMEDIATE, | ||
417 | p->syncpt), | ||
418 | NVHOST_OPCODE_NOOP); | ||
419 | /* Wait for value to be read from FIFO */ | ||
420 | nvhost_cdma_push(&channel->cdma, | ||
421 | nvhost_opcode_nonincr(NV_CLASS_HOST_WAIT_SYNCPT_BASE, 1), | ||
422 | nvhost_class_host_wait_syncpt_base(p->syncpt, | ||
423 | p->waitbase, 3)); | ||
424 | /* Indicate submit complete */ | ||
425 | nvhost_cdma_push(&channel->cdma, | ||
426 | nvhost_opcode_nonincr(NV_CLASS_HOST_INCR_SYNCPT_BASE, 1), | ||
427 | nvhost_class_host_incr_syncpt_base(p->waitbase, 4)); | ||
428 | nvhost_cdma_push(&channel->cdma, | ||
429 | NVHOST_OPCODE_NOOP, | ||
430 | nvhost_opcode_imm_incr_syncpt(NV_SYNCPT_IMMEDIATE, | ||
431 | p->syncpt)); | ||
432 | |||
433 | /* end CDMA submit */ | ||
434 | nvhost_cdma_end(&channel->cdma, job); | ||
435 | nvhost_job_put(job); | ||
436 | job = NULL; | ||
437 | |||
438 | /* | ||
439 | * schedule a context save interrupt (to drain the host FIFO | ||
440 | * if necessary, and to release the restore buffer) | ||
441 | */ | ||
442 | if (hwctx_to_save) { | ||
443 | err = nvhost_intr_add_action( | ||
444 | &nvhost_get_host(channel->dev)->intr, | ||
445 | p->syncpt, | ||
446 | syncval - syncpt_incrs | ||
447 | + hwctx_to_save->save_incrs | ||
448 | - 1, | ||
449 | NVHOST_INTR_ACTION_CTXSAVE, hwctx_to_save, | ||
450 | ctx_waiter, | ||
451 | NULL); | ||
452 | ctx_waiter = NULL; | ||
453 | WARN(err, "Failed to set context save interrupt"); | ||
454 | } | ||
455 | |||
456 | /* Wait for FIFO to be ready */ | ||
457 | err = nvhost_intr_add_action(&nvhost_get_host(channel->dev)->intr, | ||
458 | p->syncpt, syncval - 2, | ||
459 | NVHOST_INTR_ACTION_WAKEUP, &wq, | ||
460 | read_waiter, | ||
461 | &ref); | ||
462 | read_waiter = NULL; | ||
463 | WARN(err, "Failed to set wakeup interrupt"); | ||
464 | wait_event(wq, | ||
465 | nvhost_syncpt_is_expired(&nvhost_get_host(channel->dev)->syncpt, | ||
466 | p->syncpt, syncval - 2)); | ||
467 | nvhost_intr_put_ref(&nvhost_get_host(channel->dev)->intr, ref); | ||
468 | |||
469 | /* Read the register value from FIFO */ | ||
470 | err = host1x_drain_read_fifo(channel->aperture, | ||
471 | value, 1, &pending); | ||
472 | |||
473 | /* Indicate we've read the value */ | ||
474 | nvhost_syncpt_cpu_incr(&nvhost_get_host(channel->dev)->syncpt, | ||
475 | p->syncpt); | ||
476 | |||
477 | /* Schedule a submit complete interrupt */ | ||
478 | err = nvhost_intr_add_action(&nvhost_get_host(channel->dev)->intr, | ||
479 | p->syncpt, syncval, | ||
480 | NVHOST_INTR_ACTION_SUBMIT_COMPLETE, channel, | ||
481 | completed_waiter, NULL); | ||
482 | completed_waiter = NULL; | ||
483 | WARN(err, "Failed to set submit complete interrupt"); | ||
484 | |||
485 | mutex_unlock(&channel->submitlock); | ||
486 | |||
487 | done: | ||
488 | kfree(ctx_waiter); | ||
489 | kfree(read_waiter); | ||
490 | kfree(completed_waiter); | ||
491 | return err; | ||
492 | } | ||
493 | |||
494 | |||
495 | int host1x_drain_read_fifo(void __iomem *chan_regs, | ||
496 | u32 *ptr, unsigned int count, unsigned int *pending) | ||
497 | { | ||
498 | unsigned int entries = *pending; | ||
499 | unsigned long timeout = jiffies + NV_FIFO_READ_TIMEOUT; | ||
500 | while (count) { | ||
501 | unsigned int num; | ||
502 | |||
503 | while (!entries && time_before(jiffies, timeout)) { | ||
504 | /* query host for number of entries in fifo */ | ||
505 | entries = HOST1X_VAL(CHANNEL_FIFOSTAT, OUTFENTRIES, | ||
506 | readl(chan_regs + HOST1X_CHANNEL_FIFOSTAT)); | ||
507 | if (!entries) | ||
508 | cpu_relax(); | ||
509 | } | ||
510 | |||
511 | /* timeout -> return error */ | ||
512 | if (!entries) | ||
513 | return -EIO; | ||
514 | |||
515 | num = min(entries, count); | ||
516 | entries -= num; | ||
517 | count -= num; | ||
518 | |||
519 | while (num & ~0x3) { | ||
520 | u32 arr[4]; | ||
521 | arr[0] = readl(chan_regs + HOST1X_CHANNEL_INDDATA); | ||
522 | arr[1] = readl(chan_regs + HOST1X_CHANNEL_INDDATA); | ||
523 | arr[2] = readl(chan_regs + HOST1X_CHANNEL_INDDATA); | ||
524 | arr[3] = readl(chan_regs + HOST1X_CHANNEL_INDDATA); | ||
525 | memcpy(ptr, arr, 4*sizeof(u32)); | ||
526 | ptr += 4; | ||
527 | num -= 4; | ||
528 | } | ||
529 | while (num--) | ||
530 | *ptr++ = readl(chan_regs + HOST1X_CHANNEL_INDDATA); | ||
531 | } | ||
532 | *pending = entries; | ||
533 | |||
534 | return 0; | ||
535 | } | ||
536 | |||
537 | int host1x_save_context(struct nvhost_device *dev, u32 syncpt_id) | ||
538 | { | ||
539 | struct nvhost_channel *ch = dev->channel; | ||
540 | struct nvhost_hwctx *hwctx_to_save; | ||
541 | DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq); | ||
542 | u32 syncpt_incrs, syncpt_val; | ||
543 | int err = 0; | ||
544 | void *ref; | ||
545 | void *ctx_waiter = NULL, *wakeup_waiter = NULL; | ||
546 | struct nvhost_job *job; | ||
547 | |||
548 | ctx_waiter = nvhost_intr_alloc_waiter(); | ||
549 | wakeup_waiter = nvhost_intr_alloc_waiter(); | ||
550 | if (!ctx_waiter || !wakeup_waiter) { | ||
551 | err = -ENOMEM; | ||
552 | goto done; | ||
553 | } | ||
554 | |||
555 | if (dev->busy) | ||
556 | dev->busy(dev); | ||
557 | |||
558 | mutex_lock(&ch->submitlock); | ||
559 | hwctx_to_save = ch->cur_ctx; | ||
560 | if (!hwctx_to_save) { | ||
561 | mutex_unlock(&ch->submitlock); | ||
562 | goto done; | ||
563 | } | ||
564 | |||
565 | job = nvhost_job_alloc(ch, hwctx_to_save, | ||
566 | NULL, | ||
567 | nvhost_get_host(ch->dev)->nvmap, 0, 0); | ||
568 | if (IS_ERR_OR_NULL(job)) { | ||
569 | err = PTR_ERR(job); | ||
570 | mutex_unlock(&ch->submitlock); | ||
571 | goto done; | ||
572 | } | ||
573 | |||
574 | hwctx_to_save->valid = true; | ||
575 | ch->ctxhandler->get(hwctx_to_save); | ||
576 | ch->cur_ctx = NULL; | ||
577 | |||
578 | syncpt_incrs = to_host1x_hwctx(hwctx_to_save)->save_incrs; | ||
579 | syncpt_val = nvhost_syncpt_incr_max(&nvhost_get_host(ch->dev)->syncpt, | ||
580 | syncpt_id, syncpt_incrs); | ||
581 | |||
582 | job->syncpt_id = syncpt_id; | ||
583 | job->syncpt_incrs = syncpt_incrs; | ||
584 | job->syncpt_end = syncpt_val; | ||
585 | |||
586 | err = nvhost_cdma_begin(&ch->cdma, job); | ||
587 | if (err) { | ||
588 | mutex_unlock(&ch->submitlock); | ||
589 | goto done; | ||
590 | } | ||
591 | |||
592 | ch->ctxhandler->save_push(hwctx_to_save, &ch->cdma); | ||
593 | nvhost_cdma_end(&ch->cdma, job); | ||
594 | nvhost_job_put(job); | ||
595 | job = NULL; | ||
596 | |||
597 | err = nvhost_intr_add_action(&nvhost_get_host(ch->dev)->intr, syncpt_id, | ||
598 | syncpt_val - syncpt_incrs + | ||
599 | to_host1x_hwctx(hwctx_to_save)->save_thresh, | ||
600 | NVHOST_INTR_ACTION_CTXSAVE, hwctx_to_save, | ||
601 | ctx_waiter, | ||
602 | NULL); | ||
603 | ctx_waiter = NULL; | ||
604 | WARN(err, "Failed to set context save interrupt"); | ||
605 | |||
606 | err = nvhost_intr_add_action(&nvhost_get_host(ch->dev)->intr, | ||
607 | syncpt_id, syncpt_val, | ||
608 | NVHOST_INTR_ACTION_WAKEUP, &wq, | ||
609 | wakeup_waiter, | ||
610 | &ref); | ||
611 | wakeup_waiter = NULL; | ||
612 | WARN(err, "Failed to set wakeup interrupt"); | ||
613 | wait_event(wq, | ||
614 | nvhost_syncpt_is_expired(&nvhost_get_host(ch->dev)->syncpt, | ||
615 | syncpt_id, syncpt_val)); | ||
616 | |||
617 | nvhost_intr_put_ref(&nvhost_get_host(ch->dev)->intr, ref); | ||
618 | |||
619 | nvhost_cdma_update(&ch->cdma); | ||
620 | |||
621 | mutex_unlock(&ch->submitlock); | ||
622 | |||
623 | done: | ||
624 | kfree(ctx_waiter); | ||
625 | kfree(wakeup_waiter); | ||
626 | return err; | ||
627 | } | ||
diff --git a/drivers/video/tegra/host/host1x/host1x_channel.h b/drivers/video/tegra/host/host1x/host1x_channel.h new file mode 100644 index 00000000000..4113dbcada2 --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_channel.h | |||
@@ -0,0 +1,45 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_channel.h | ||
3 | * | ||
4 | * Tegra Graphics Host Channel | ||
5 | * | ||
6 | * Copyright (c) 2011-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
#ifndef __NVHOST_HOST1X_CHANNEL_H
#define __NVHOST_HOST1X_CHANNEL_H

struct nvhost_job;
struct nvhost_channel;
struct nvhost_hwctx;
struct nvhost_device;

/* Submit job to a host1x client; returns 0 or a negative errno */
int host1x_channel_submit(struct nvhost_job *job);

/* Read 3d register via FIFO */
int host1x_channel_read_3d_reg(
	struct nvhost_channel *channel,
	struct nvhost_hwctx *hwctx,
	u32 offset,
	u32 *value);

/* Reads words from FIFO; *pending carries known-available entries */
int host1x_drain_read_fifo(void __iomem *chan_regs,
		u32 *ptr, unsigned int count, unsigned int *pending);

/* Save the channel's resident context and wait for completion */
int host1x_save_context(struct nvhost_device *dev, u32 syncpt_id);

#endif
diff --git a/drivers/video/tegra/host/host1x/host1x_debug.c b/drivers/video/tegra/host/host1x/host1x_debug.c new file mode 100644 index 00000000000..1a1d764bbd6 --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_debug.c | |||
@@ -0,0 +1,404 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_debug.c | ||
3 | * | ||
4 | * Copyright (C) 2010 Google, Inc. | ||
5 | * Author: Erik Gilling <konkers@android.com> | ||
6 | * | ||
7 | * Copyright (C) 2011 NVIDIA Corporation | ||
8 | * | ||
9 | * This software is licensed under the terms of the GNU General Public | ||
10 | * License version 2, as published by the Free Software Foundation, and | ||
11 | * may be copied, distributed, and modified under those terms. | ||
12 | * | ||
13 | * This program is distributed in the hope that it will be useful, | ||
14 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
15 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
16 | * GNU General Public License for more details. | ||
17 | * | ||
18 | */ | ||
19 | |||
20 | #include <linux/debugfs.h> | ||
21 | #include <linux/seq_file.h> | ||
22 | #include <linux/mm.h> | ||
23 | |||
24 | #include <linux/io.h> | ||
25 | |||
26 | #include "dev.h" | ||
27 | #include "debug.h" | ||
28 | #include "nvhost_cdma.h" | ||
29 | #include "../../nvmap/nvmap.h" | ||
30 | |||
31 | #include "host1x_hardware.h" | ||
32 | #include "host1x_cdma.h" | ||
33 | |||
/* Refuse to dump gathers whose offset within the pinned buffer exceeds
 * this many bytes (guards against mismatched pin addresses). */
#define NVHOST_DEBUG_MAX_PAGE_OFFSET 102400

/* Parser states for decoding a host1x command stream */
enum {
	NVHOST_DBG_STATE_CMD = 0,	/* expecting a command word */
	NVHOST_DBG_STATE_DATA = 1,	/* expecting operand data words */
	NVHOST_DBG_STATE_GATHER = 2	/* expecting a gather address word */
};
41 | |||
/*
 * Decode a single host1x command word and print it to @o.
 *
 * Where the command carries a payload, *count is set to the number of
 * following words. Returns the parser state for the next word: CMD
 * (new command), DATA (*count operand words), or GATHER (one gather
 * address word follows).
 */
static int show_channel_command(struct output *o, u32 addr, u32 val, int *count)
{
	unsigned mask;
	unsigned subop;

	/* opcode is the top nibble of the command word */
	switch (val >> 28) {
	case 0x0:
		/* SETCL: mask != 0 means class change plus masked writes */
		mask = val & 0x3f;
		if (mask) {
			nvhost_debug_output(o,
				"SETCL(class=%03x, offset=%03x, mask=%02x, [",
				val >> 6 & 0x3ff, val >> 16 & 0xfff, mask);
			*count = hweight8(mask);
			return NVHOST_DBG_STATE_DATA;
		} else {
			nvhost_debug_output(o, "SETCL(class=%03x)\n",
				val >> 6 & 0x3ff);
			return NVHOST_DBG_STATE_CMD;
		}

	case 0x1:
		/* INCR: payload words go to consecutive registers */
		nvhost_debug_output(o, "INCR(offset=%03x, [",
			val >> 16 & 0xfff);
		*count = val & 0xffff;
		return NVHOST_DBG_STATE_DATA;

	case 0x2:
		/* NONINCR: payload words all go to one register */
		nvhost_debug_output(o, "NONINCR(offset=%03x, [",
			val >> 16 & 0xfff);
		*count = val & 0xffff;
		return NVHOST_DBG_STATE_DATA;

	case 0x3:
		/* MASK: one payload word per set bit */
		mask = val & 0xffff;
		nvhost_debug_output(o, "MASK(offset=%03x, mask=%03x, [",
			val >> 16 & 0xfff, mask);
		*count = hweight16(mask);
		return NVHOST_DBG_STATE_DATA;

	case 0x4:
		/* IMM: data is carried in the command word itself */
		nvhost_debug_output(o, "IMM(offset=%03x, data=%03x)\n",
			val >> 16 & 0xfff, val & 0xffff);
		return NVHOST_DBG_STATE_CMD;

	case 0x5:
		nvhost_debug_output(o, "RESTART(offset=%08x)\n", val << 4);
		return NVHOST_DBG_STATE_CMD;

	case 0x6:
		/* GATHER: the next stream word is the buffer address */
		nvhost_debug_output(o, "GATHER(offset=%03x, insert=%d, type=%d, count=%04x, addr=[",
			val >> 16 & 0xfff, val >> 15 & 0x1, val >> 14 & 0x1,
			val & 0x3fff);
		*count = val & 0x3fff; /* TODO: insert */
		return NVHOST_DBG_STATE_GATHER;

	case 0xe:
		/* EXTEND: mlock acquire/release subops */
		subop = val >> 24 & 0xf;
		if (subop == 0)
			nvhost_debug_output(o, "ACQUIRE_MLOCK(index=%d)\n",
				val & 0xff);
		else if (subop == 1)
			nvhost_debug_output(o, "RELEASE_MLOCK(index=%d)\n",
				val & 0xff);
		else
			nvhost_debug_output(o, "EXTEND_UNKNOWN(%08x)\n", val);
		return NVHOST_DBG_STATE_CMD;

	default:
		return NVHOST_DBG_STATE_CMD;
	}
}
113 | |||
114 | static void show_channel_gather(struct output *o, u32 addr, | ||
115 | phys_addr_t phys_addr, u32 words, struct nvhost_cdma *cdma); | ||
116 | |||
/*
 * Feed one 32-bit stream word into the command parser and print it.
 * *state and *count carry the parser state between calls.
 *
 * NOTE(review): start_count/dont_print are function-static, so this
 * parser is not reentrant - presumably debugfs dumps are serialized;
 * confirm before calling from multiple contexts.
 */
static void show_channel_word(struct output *o, int *state, int *count,
		u32 addr, u32 val, struct nvhost_cdma *cdma)
{
	static int start_count, dont_print;

	switch (*state) {
	case NVHOST_DBG_STATE_CMD:
		/* prefix with the word's address when one is known */
		if (addr)
			nvhost_debug_output(o, "%08x: %08x:", addr, val);
		else
			nvhost_debug_output(o, "%08x:", val);

		*state = show_channel_command(o, addr, val, count);
		dont_print = 0;
		start_count = *count;
		/* command with an empty payload: close the bracket now */
		if (*state == NVHOST_DBG_STATE_DATA && *count == 0) {
			*state = NVHOST_DBG_STATE_CMD;
			nvhost_debug_output(o, "])\n");
		}
		break;

	case NVHOST_DBG_STATE_DATA:
		(*count)--;
		/* print at most the first 64 data words, then truncate */
		if (start_count - *count < 64)
			nvhost_debug_output(o, "%08x%s",
				val, *count > 0 ? ", " : "])\n");
		else if (!dont_print && (*count > 0)) {
			nvhost_debug_output(o, "[truncated; %d more words]\n",
				*count);
			dont_print = 1;
		}
		if (*count == 0)
			*state = NVHOST_DBG_STATE_CMD;
		break;

	case NVHOST_DBG_STATE_GATHER:
		*state = NVHOST_DBG_STATE_CMD;
		nvhost_debug_output(o, "%08x]):\n", val);
		/* recurse into the gather buffer contents, if possible */
		if (cdma) {
			show_channel_gather(o, addr, val,
					*count, cdma);
		}
		break;
	}
}
162 | |||
/*
 * Disassemble the contents of a gather buffer referenced from the push
 * buffer. @addr is the pushbuffer address of the gather op pair (used
 * to look up the owning nvmap handle), @phys_addr the gather's hardware
 * address and @words its length in 32-bit words.
 *
 * Compiled out (no-op) when CONFIG_TEGRA_NVMAP is not set.
 */
static void show_channel_gather(struct output *o, u32 addr,
		phys_addr_t phys_addr,
		u32 words, struct nvhost_cdma *cdma)
{
#if defined(CONFIG_TEGRA_NVMAP)
	/* Map dmaget cursor to corresponding nvmap_handle */
	struct push_buffer *pb = &cdma->push_buffer;
	u32 cur = addr - pb->phys;
	struct nvmap_client_handle *nvmap = &pb->nvmap[cur/8];
	struct nvmap_handle_ref ref;
	u32 *map_addr, offset;
	phys_addr_t pin_addr;
	int state, count, i;

	/* sentinel handle value marks a context-save push, not a gather */
	if ((u32)nvmap->handle == NVHOST_CDMA_PUSH_GATHER_CTXSAVE) {
		nvhost_debug_output(o, "[context save]\n");
		return;
	}

	if (!nvmap->handle || !nvmap->client
			|| atomic_read(&nvmap->handle->ref) < 1) {
		nvhost_debug_output(o, "[already deallocated]\n");
		return;
	}

	/* Create a fake nvmap_handle_ref - nvmap requires it
	 * but accesses only the first field - nvmap_handle */
	ref.handle = nvmap->handle;

	map_addr = nvmap_mmap(&ref);
	if (!map_addr) {
		nvhost_debug_output(o, "[could not mmap]\n");
		return;
	}

	/* Get base address from nvmap */
	pin_addr = nvmap_pin(nvmap->client, &ref);
	if (IS_ERR_VALUE(pin_addr)) {
		nvhost_debug_output(o, "[couldn't pin]\n");
		nvmap_munmap(&ref, map_addr);
		return;
	}

	offset = phys_addr - pin_addr;
	/*
	 * Sometimes we're given different hardware address to the same
	 * page - in these cases the offset will get an invalid number and
	 * we just have to bail out.
	 */
	if (offset > NVHOST_DEBUG_MAX_PAGE_OFFSET) {
		nvhost_debug_output(o, "[address mismatch]\n");
	} else {
		/* GATHER buffer starts always with commands */
		state = NVHOST_DBG_STATE_CMD;
		for (i = 0; i < words; i++)
			show_channel_word(o, &state, &count,
					phys_addr + i * 4,
					*(map_addr + offset/4 + i),
					cdma);
	}
	nvmap_unpin(nvmap->client, &ref);
	nvmap_munmap(&ref, map_addr);
#endif
}
227 | |||
228 | static void show_channel_pair(struct output *o, u32 addr, | ||
229 | u32 w0, u32 w1, struct nvhost_cdma *cdma) | ||
230 | { | ||
231 | int state = NVHOST_DBG_STATE_CMD; | ||
232 | int count; | ||
233 | |||
234 | show_channel_word(o, &state, &count, addr, w0, cdma); | ||
235 | show_channel_word(o, &state, &count, addr+4, w1, cdma); | ||
236 | } | ||
237 | |||
238 | /** | ||
239 | * Retrieve the op pair at a slot offset from a DMA address | ||
240 | */ | ||
241 | static void cdma_peek(struct nvhost_cdma *cdma, | ||
242 | u32 dmaget, int slot, u32 *out) | ||
243 | { | ||
244 | u32 offset = dmaget - cdma->push_buffer.phys; | ||
245 | u32 *p = cdma->push_buffer.mapped; | ||
246 | |||
247 | offset = ((offset + slot * 8) & (PUSH_BUFFER_SIZE - 1)) >> 2; | ||
248 | out[0] = p[offset]; | ||
249 | out[1] = p[offset + 1]; | ||
250 | } | ||
251 | |||
252 | u32 previous_oppair(struct nvhost_cdma *cdma, u32 cur) | ||
253 | { | ||
254 | u32 pb = cdma->push_buffer.phys; | ||
255 | u32 prev = cur-8; | ||
256 | if (prev < pb) | ||
257 | prev += PUSH_BUFFER_SIZE; | ||
258 | return prev; | ||
259 | } | ||
260 | |||
/*
 * Dump one channel's CDMA state: what it is currently executing or
 * waiting on (decoded from CBSTAT/CBREAD), the DMA pointers, and the
 * opcode pair just behind the current fetch position.
 */
static void t20_debug_show_channel_cdma(struct nvhost_master *m,
	struct nvhost_channel *ch, struct output *o, int chid)
{
	struct nvhost_channel *channel = ch;
	struct nvhost_cdma *cdma = &channel->cdma;
	u32 dmaput, dmaget, dmactrl;
	u32 cbstat, cbread;
	u32 val, base, baseval;
	u32 pbw[2];

	dmaput = readl(channel->aperture + HOST1X_CHANNEL_DMAPUT);
	dmaget = readl(channel->aperture + HOST1X_CHANNEL_DMAGET);
	dmactrl = readl(channel->aperture + HOST1X_CHANNEL_DMACTRL);
	cbread = readl(m->sync_aperture + HOST1X_SYNC_CBREAD_x(chid));
	cbstat = readl(m->sync_aperture + HOST1X_SYNC_CBSTAT_x(chid));

	nvhost_debug_output(o, "%d-%s (%d): ", chid,
			channel->dev->name,
			channel->dev->refcount);

	/* nothing to decode if DMA is stopped or no push buffer exists */
	if (HOST1X_VAL(CHANNEL_DMACTRL, DMASTOP, dmactrl)
		|| !channel->cdma.push_buffer.mapped) {
		nvhost_debug_output(o, "inactive\n\n");
		return;
	}

	/* cbstat is (class << 16) | method; class 0x1 is host1x */
	switch (cbstat) {
	case 0x00010008:
		/* NV_CLASS_HOST_WAIT_SYNCPT: id in 31:24, value in 23:0 */
		nvhost_debug_output(o, "waiting on syncpt %d val %d\n",
			cbread >> 24, cbread & 0xffffff);
		break;

	case 0x00010009:
		/* NV_CLASS_HOST_WAIT_SYNCPT_BASE: id in 31:24, base index
		 * in 23:16, offset in 15:0; effective threshold is the
		 * wait base's current value plus the offset */
		base = (cbread >> 16) & 0xff;
		val = readl(m->sync_aperture +
				HOST1X_SYNC_SYNCPT_BASE_x(base));
		baseval = HOST1X_VAL(SYNC_SYNCPT_BASE_0, BASE, val);
		val = cbread & 0xffff;
		nvhost_debug_output(o, "waiting on syncpt %d val %d "
			"(base %d = %d; offset = %d)\n",
			cbread >> 24, baseval + val,
			base, baseval, val);
		break;

	default:
		nvhost_debug_output(o,
			"active class %02x, offset %04x, val %08x\n",
			HOST1X_VAL(SYNC_CBSTAT_0, CBCLASS0, cbstat),
			HOST1X_VAL(SYNC_CBSTAT_0, CBOFFSET0, cbstat),
			cbread);
		break;
	}

	nvhost_debug_output(o, "DMAPUT %08x, DMAGET %08x, DMACTL %08x\n",
		dmaput, dmaget, dmactrl);
	nvhost_debug_output(o, "CBREAD %08x, CBSTAT %08x\n", cbread, cbstat);

	/* show the opcode pair immediately before the fetch position */
	cdma_peek(cdma, dmaget, -1, pbw);
	show_channel_pair(o, previous_oppair(cdma, dmaget),
			pbw[0], pbw[1], &channel->cdma);
	nvhost_debug_output(o, "\n");
}
323 | |||
/*
 * Dump a channel's command FIFO contents via the CFPEEK debug window.
 * Takes over CFPEEK_CTRL for the duration; leaves it cleared on return.
 */
void t20_debug_show_channel_fifo(struct nvhost_master *m,
	struct nvhost_channel *ch, struct output *o, int chid)
{
	u32 val, rd_ptr, wr_ptr, start, end;
	struct nvhost_channel *channel = ch;
	int state, count;

	nvhost_debug_output(o, "%d: fifo:\n", chid);

	val = readl(channel->aperture + HOST1X_CHANNEL_FIFOSTAT);
	nvhost_debug_output(o, "FIFOSTAT %08x\n", val);
	if (HOST1X_VAL(CHANNEL_FIFOSTAT, CFEMPTY, val)) {
		nvhost_debug_output(o, "[empty]\n");
		return;
	}

	/* enable peeking into this channel's FIFO */
	writel(0x0, m->sync_aperture + HOST1X_SYNC_CFPEEK_CTRL);
	writel(HOST1X_CREATE(SYNC_CFPEEK_CTRL, ENA, 1)
			| HOST1X_CREATE(SYNC_CFPEEK_CTRL, CHANNR, chid),
		m->sync_aperture + HOST1X_SYNC_CFPEEK_CTRL);

	/* fetch the FIFO read/write pointers and its base/limit */
	val = readl(m->sync_aperture + HOST1X_SYNC_CFPEEK_PTRS);
	rd_ptr = HOST1X_VAL(SYNC_CFPEEK_PTRS, CF_RD_PTR, val);
	wr_ptr = HOST1X_VAL(SYNC_CFPEEK_PTRS, CF_WR_PTR, val);

	val = readl(m->sync_aperture + HOST1X_SYNC_CFx_SETUP(chid));
	start = HOST1X_VAL(SYNC_CF0_SETUP, BASE, val);
	end = HOST1X_VAL(SYNC_CF0_SETUP, LIMIT, val);

	state = NVHOST_DBG_STATE_CMD;

	/* walk entries from rd_ptr to wr_ptr, wrapping at the limit.
	 * NOTE(review): 'count' is handed to show_channel_word without
	 * initialization; presumably it is written on the first CMD-state
	 * call before ever being read - confirm in show_channel_word. */
	do {
		writel(0x0, m->sync_aperture + HOST1X_SYNC_CFPEEK_CTRL);
		writel(HOST1X_CREATE(SYNC_CFPEEK_CTRL, ENA, 1)
				| HOST1X_CREATE(SYNC_CFPEEK_CTRL, CHANNR, chid)
				| HOST1X_CREATE(SYNC_CFPEEK_CTRL, ADDR, rd_ptr),
			m->sync_aperture + HOST1X_SYNC_CFPEEK_CTRL);
		val = readl(m->sync_aperture + HOST1X_SYNC_CFPEEK_READ);

		show_channel_word(o, &state, &count, 0, val, NULL);

		if (rd_ptr == end)
			rd_ptr = start;
		else
			rd_ptr++;
	} while (rd_ptr != wr_ptr);

	/* close a data list left open at the FIFO's end */
	if (state == NVHOST_DBG_STATE_DATA)
		nvhost_debug_output(o, ", ...])\n");
	nvhost_debug_output(o, "\n");

	writel(0x0, m->sync_aperture + HOST1X_SYNC_CFPEEK_CTRL);
}
377 | |||
378 | static void t20_debug_show_mlocks(struct nvhost_master *m, struct output *o) | ||
379 | { | ||
380 | u32 __iomem *mlo_regs = m->sync_aperture + HOST1X_SYNC_MLOCK_OWNER_0; | ||
381 | int i; | ||
382 | |||
383 | nvhost_debug_output(o, "---- mlocks ----\n"); | ||
384 | for (i = 0; i < NV_HOST1X_NB_MLOCKS; i++) { | ||
385 | u32 owner = readl(mlo_regs + i); | ||
386 | if (HOST1X_VAL(SYNC_MLOCK_OWNER_0, CH_OWNS, owner)) | ||
387 | nvhost_debug_output(o, "%d: locked by channel %d\n", | ||
388 | i, HOST1X_VAL(SYNC_MLOCK_OWNER_0, CHID, owner)); | ||
389 | else if (HOST1X_VAL(SYNC_MLOCK_OWNER_0, CPU_OWNS, owner)) | ||
390 | nvhost_debug_output(o, "%d: locked by cpu\n", i); | ||
391 | else | ||
392 | nvhost_debug_output(o, "%d: unlocked\n", i); | ||
393 | } | ||
394 | nvhost_debug_output(o, "\n"); | ||
395 | } | ||
396 | |||
/* Install the Tegra2-generation debug dump operations. Returns 0. */
int nvhost_init_t20_debug_support(struct nvhost_master *host)
{
	host->op.debug.show_channel_cdma = t20_debug_show_channel_cdma;
	host->op.debug.show_channel_fifo = t20_debug_show_channel_fifo;
	host->op.debug.show_mlocks = t20_debug_show_mlocks;

	return 0;
}
diff --git a/drivers/video/tegra/host/host1x/host1x_hardware.h b/drivers/video/tegra/host/host1x/host1x_hardware.h new file mode 100644 index 00000000000..d13d5752364 --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_hardware.h | |||
@@ -0,0 +1,274 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_hardware.h | ||
3 | * | ||
4 | * Tegra Graphics Host Register Offsets | ||
5 | * | ||
6 | * Copyright (c) 2010-2012 NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
21 | #ifndef __NVHOST_HOST1X_HOST1X_HARDWARE_H | ||
22 | #define __NVHOST_HOST1X_HOST1X_HARDWARE_H | ||
23 | |||
24 | #include <linux/types.h> | ||
25 | #include <linux/bitops.h> | ||
26 | |||
27 | /* class ids */ | ||
28 | enum { | ||
29 | NV_HOST1X_CLASS_ID = 0x1, | ||
30 | NV_VIDEO_ENCODE_MPEG_CLASS_ID = 0x20, | ||
31 | NV_GRAPHICS_3D_CLASS_ID = 0x60 | ||
32 | }; | ||
33 | |||
34 | |||
35 | /* channel registers */ | ||
36 | #define NV_HOST1X_CHANNELS 8 | ||
37 | #define NV_HOST1X_CHANNEL0_BASE 0 | ||
38 | #define NV_HOST1X_CHANNEL_MAP_SIZE_BYTES 16384 | ||
39 | #define NV_HOST1X_SYNC_MLOCK_NUM 16 | ||
40 | |||
/* Extract a named field from a register value (shift then mask).
 * All macro arguments are fully parenthesized so that expression
 * arguments (e.g. "a | b") expand with the intended precedence. */
#define HOST1X_VAL(reg, field, regdata) \
	(((regdata) >> HOST1X_##reg##_##field##_SHIFT) \
		& HOST1X_##reg##_##field##_MASK)
/* Build a register value with the named field set to 'data'. */
#define HOST1X_CREATE(reg, field, data) \
	(((data) & HOST1X_##reg##_##field##_MASK) \
		<< HOST1X_##reg##_##field##_SHIFT)
47 | |||
48 | #define HOST1X_CHANNEL_FIFOSTAT 0x00 | ||
49 | #define HOST1X_CHANNEL_FIFOSTAT_CFEMPTY_SHIFT 10 | ||
50 | #define HOST1X_CHANNEL_FIFOSTAT_CFEMPTY_MASK 0x1 | ||
51 | #define HOST1X_CHANNEL_FIFOSTAT_OUTFENTRIES_SHIFT 24 | ||
52 | #define HOST1X_CHANNEL_FIFOSTAT_OUTFENTRIES_MASK 0x1f | ||
53 | #define HOST1X_CHANNEL_INDDATA 0x0c | ||
54 | #define HOST1X_CHANNEL_DMASTART 0x14 | ||
55 | #define HOST1X_CHANNEL_DMAPUT 0x18 | ||
56 | #define HOST1X_CHANNEL_DMAGET 0x1c | ||
57 | #define HOST1X_CHANNEL_DMAEND 0x20 | ||
58 | #define HOST1X_CHANNEL_DMACTRL 0x24 | ||
59 | #define HOST1X_CHANNEL_DMACTRL_DMASTOP_SHIFT 0 | ||
60 | #define HOST1X_CHANNEL_DMACTRL_DMASTOP_MASK 0x1 | ||
61 | #define HOST1X_CHANNEL_DMACTRL_DMAGETRST_SHIFT 1 | ||
62 | #define HOST1X_CHANNEL_DMACTRL_DMAGETRST_MASK 0x1 | ||
63 | #define HOST1X_CHANNEL_DMACTRL_DMAINITGET_SHIFT 2 | ||
64 | #define HOST1X_CHANNEL_DMACTRL_DMAINITGET_MASK 0x1 | ||
65 | |||
66 | #define HOST1X_CHANNEL_SYNC_REG_BASE 0x3000 | ||
67 | |||
68 | #define HOST1X_SYNC_INTMASK 0x4 | ||
69 | #define HOST1X_SYNC_INTC0MASK 0x8 | ||
70 | #define HOST1X_SYNC_HINTSTATUS 0x20 | ||
71 | #define HOST1X_SYNC_HINTMASK 0x24 | ||
72 | #define HOST1X_SYNC_HINTSTATUS_EXT 0x28 | ||
73 | #define HOST1X_SYNC_HINTSTATUS_EXT_IP_READ_INT_SHIFT 30 | ||
74 | #define HOST1X_SYNC_HINTSTATUS_EXT_IP_READ_INT_MASK 0x1 | ||
75 | #define HOST1X_SYNC_HINTSTATUS_EXT_IP_WRITE_INT_SHIFT 31 | ||
76 | #define HOST1X_SYNC_HINTSTATUS_EXT_IP_WRITE_INT_MASK 0x1 | ||
77 | #define HOST1X_SYNC_HINTMASK_EXT 0x2c | ||
78 | #define HOST1X_SYNC_SYNCPT_THRESH_CPU0_INT_STATUS 0x40 | ||
79 | #define HOST1X_SYNC_SYNCPT_THRESH_CPU1_INT_STATUS 0x48 | ||
80 | #define HOST1X_SYNC_SYNCPT_THRESH_INT_DISABLE 0x60 | ||
81 | #define HOST1X_SYNC_SYNCPT_THRESH_INT_ENABLE_CPU0 0x68 | ||
82 | #define HOST1X_SYNC_CF0_SETUP 0x80 | ||
83 | #define HOST1X_SYNC_CF0_SETUP_BASE_SHIFT 0 | ||
84 | #define HOST1X_SYNC_CF0_SETUP_BASE_MASK 0x1ff | ||
85 | #define HOST1X_SYNC_CF0_SETUP_LIMIT_SHIFT 16 | ||
86 | #define HOST1X_SYNC_CF0_SETUP_LIMIT_MASK 0x1ff | ||
87 | #define HOST1X_SYNC_CFx_SETUP(x) (HOST1X_SYNC_CF0_SETUP + (4 * (x))) | ||
88 | |||
89 | #define HOST1X_SYNC_CMDPROC_STOP 0xac | ||
90 | #define HOST1X_SYNC_CH_TEARDOWN 0xb0 | ||
91 | #define HOST1X_SYNC_USEC_CLK 0x1a4 | ||
92 | #define HOST1X_SYNC_CTXSW_TIMEOUT_CFG 0x1a8 | ||
93 | #define HOST1X_SYNC_IP_BUSY_TIMEOUT 0x1bc | ||
94 | #define HOST1X_SYNC_IP_READ_TIMEOUT_ADDR 0x1c0 | ||
95 | #define HOST1X_SYNC_IP_WRITE_TIMEOUT_ADDR 0x1c4 | ||
96 | #define HOST1X_SYNC_MLOCK_0 0x2c0 | ||
97 | #define HOST1X_SYNC_MLOCK_OWNER_0 0x340 | ||
98 | #define HOST1X_SYNC_MLOCK_OWNER_0_CHID_SHIFT 8 | ||
99 | #define HOST1X_SYNC_MLOCK_OWNER_0_CHID_MASK 0xf | ||
100 | #define HOST1X_SYNC_MLOCK_OWNER_0_CPU_OWNS_SHIFT 1 | ||
101 | #define HOST1X_SYNC_MLOCK_OWNER_0_CPU_OWNS_MASK 0x1 | ||
102 | #define HOST1X_SYNC_MLOCK_OWNER_0_CH_OWNS_SHIFT 0 | ||
103 | #define HOST1X_SYNC_MLOCK_OWNER_0_CH_OWNS_MASK 0x1 | ||
104 | #define HOST1X_SYNC_SYNCPT_0 0x400 | ||
105 | #define HOST1X_SYNC_SYNCPT_INT_THRESH_0 0x500 | ||
106 | |||
107 | #define HOST1X_SYNC_SYNCPT_BASE_0 0x600 | ||
108 | #define HOST1X_SYNC_SYNCPT_BASE_0_BASE_SHIFT 0 | ||
109 | #define HOST1X_SYNC_SYNCPT_BASE_0_BASE_MASK 0xffff | ||
110 | #define HOST1X_SYNC_SYNCPT_BASE_x(x) (HOST1X_SYNC_SYNCPT_BASE_0 + (4 * (x))) | ||
111 | |||
112 | #define HOST1X_SYNC_SYNCPT_CPU_INCR 0x700 | ||
113 | |||
114 | #define HOST1X_SYNC_CBREAD_0 0x720 | ||
115 | #define HOST1X_SYNC_CBREAD_x(x) (HOST1X_SYNC_CBREAD_0 + (4 * (x))) | ||
116 | #define HOST1X_SYNC_CFPEEK_CTRL 0x74c | ||
117 | #define HOST1X_SYNC_CFPEEK_CTRL_ADDR_SHIFT 0 | ||
118 | #define HOST1X_SYNC_CFPEEK_CTRL_ADDR_MASK 0x1ff | ||
119 | #define HOST1X_SYNC_CFPEEK_CTRL_CHANNR_SHIFT 16 | ||
120 | #define HOST1X_SYNC_CFPEEK_CTRL_CHANNR_MASK 0x7 | ||
121 | #define HOST1X_SYNC_CFPEEK_CTRL_ENA_SHIFT 31 | ||
122 | #define HOST1X_SYNC_CFPEEK_CTRL_ENA_MASK 0x1 | ||
123 | #define HOST1X_SYNC_CFPEEK_READ 0x750 | ||
124 | #define HOST1X_SYNC_CFPEEK_PTRS 0x754 | ||
125 | #define HOST1X_SYNC_CFPEEK_PTRS_CF_RD_PTR_SHIFT 0 | ||
126 | #define HOST1X_SYNC_CFPEEK_PTRS_CF_RD_PTR_MASK 0x1ff | ||
127 | #define HOST1X_SYNC_CFPEEK_PTRS_CF_WR_PTR_SHIFT 16 | ||
128 | #define HOST1X_SYNC_CFPEEK_PTRS_CF_WR_PTR_MASK 0x1ff | ||
129 | #define HOST1X_SYNC_CBSTAT_0 0x758 | ||
130 | #define HOST1X_SYNC_CBSTAT_0_CBOFFSET0_SHIFT 0 | ||
131 | #define HOST1X_SYNC_CBSTAT_0_CBOFFSET0_MASK 0xffff | ||
132 | #define HOST1X_SYNC_CBSTAT_0_CBCLASS0_SHIFT 16 | ||
133 | #define HOST1X_SYNC_CBSTAT_0_CBCLASS0_MASK 0xffff | ||
134 | #define HOST1X_SYNC_CBSTAT_x(x) (HOST1X_SYNC_CBSTAT_0 + (4 * (x))) | ||
135 | |||
136 | /* sync registers */ | ||
137 | #define NV_HOST1X_SYNCPT_NB_PTS 32 | ||
138 | #define NV_HOST1X_SYNCPT_NB_BASES 8 | ||
139 | #define NV_HOST1X_NB_MLOCKS 16 | ||
140 | |||
141 | /* host class methods */ | ||
142 | enum { | ||
143 | NV_CLASS_HOST_INCR_SYNCPT = 0x0, | ||
144 | NV_CLASS_HOST_WAIT_SYNCPT = 0x8, | ||
145 | NV_CLASS_HOST_WAIT_SYNCPT_BASE = 0x9, | ||
146 | NV_CLASS_HOST_LOAD_SYNCPT_BASE = 0xb, | ||
147 | NV_CLASS_HOST_INCR_SYNCPT_BASE = 0xc, | ||
148 | NV_CLASS_HOST_INDOFF = 0x2d, | ||
149 | NV_CLASS_HOST_INDDATA = 0x2e | ||
150 | }; | ||
151 | /* sync point conditionals */ | ||
152 | enum { | ||
153 | NV_SYNCPT_IMMEDIATE = 0x0, | ||
154 | NV_SYNCPT_OP_DONE = 0x1, | ||
155 | NV_SYNCPT_RD_DONE = 0x2, | ||
156 | NV_SYNCPT_REG_WR_SAFE = 0x3, | ||
157 | }; | ||
158 | |||
159 | static inline u32 nvhost_class_host_wait_syncpt( | ||
160 | unsigned indx, unsigned threshold) | ||
161 | { | ||
162 | return (indx << 24) | (threshold & 0xffffff); | ||
163 | } | ||
164 | |||
165 | static inline u32 nvhost_class_host_load_syncpt_base( | ||
166 | unsigned indx, unsigned threshold) | ||
167 | { | ||
168 | return (indx << 24) | (threshold & 0xffffff); | ||
169 | } | ||
170 | |||
171 | static inline u32 nvhost_class_host_wait_syncpt_base( | ||
172 | unsigned indx, unsigned base_indx, unsigned offset) | ||
173 | { | ||
174 | return (indx << 24) | (base_indx << 16) | offset; | ||
175 | } | ||
176 | |||
177 | static inline u32 nvhost_class_host_incr_syncpt_base( | ||
178 | unsigned base_indx, unsigned offset) | ||
179 | { | ||
180 | return (base_indx << 24) | offset; | ||
181 | } | ||
182 | |||
183 | static inline u32 nvhost_class_host_incr_syncpt( | ||
184 | unsigned cond, unsigned indx) | ||
185 | { | ||
186 | return (cond << 8) | indx; | ||
187 | } | ||
188 | |||
189 | enum { | ||
190 | NV_HOST_MODULE_HOST1X = 0, | ||
191 | NV_HOST_MODULE_MPE = 1, | ||
192 | NV_HOST_MODULE_GR3D = 6 | ||
193 | }; | ||
194 | |||
195 | static inline u32 nvhost_class_host_indoff_reg_write( | ||
196 | unsigned mod_id, unsigned offset, bool auto_inc) | ||
197 | { | ||
198 | u32 v = (0xf << 28) | (mod_id << 18) | (offset << 2); | ||
199 | if (auto_inc) | ||
200 | v |= BIT(27); | ||
201 | return v; | ||
202 | } | ||
203 | |||
204 | static inline u32 nvhost_class_host_indoff_reg_read( | ||
205 | unsigned mod_id, unsigned offset, bool auto_inc) | ||
206 | { | ||
207 | u32 v = (mod_id << 18) | (offset << 2) | 1; | ||
208 | if (auto_inc) | ||
209 | v |= BIT(27); | ||
210 | return v; | ||
211 | } | ||
212 | |||
213 | |||
214 | /* cdma opcodes */ | ||
215 | static inline u32 nvhost_opcode_setclass( | ||
216 | unsigned class_id, unsigned offset, unsigned mask) | ||
217 | { | ||
218 | return (0 << 28) | (offset << 16) | (class_id << 6) | mask; | ||
219 | } | ||
220 | |||
221 | static inline u32 nvhost_opcode_incr(unsigned offset, unsigned count) | ||
222 | { | ||
223 | return (1 << 28) | (offset << 16) | count; | ||
224 | } | ||
225 | |||
226 | static inline u32 nvhost_opcode_nonincr(unsigned offset, unsigned count) | ||
227 | { | ||
228 | return (2 << 28) | (offset << 16) | count; | ||
229 | } | ||
230 | |||
231 | static inline u32 nvhost_opcode_mask(unsigned offset, unsigned mask) | ||
232 | { | ||
233 | return (3 << 28) | (offset << 16) | mask; | ||
234 | } | ||
235 | |||
236 | static inline u32 nvhost_opcode_imm(unsigned offset, unsigned value) | ||
237 | { | ||
238 | return (4 << 28) | (offset << 16) | value; | ||
239 | } | ||
240 | |||
/* Immediate syncpt increment: opcode-4 write of (cond, indx) to the
 * host class INCR_SYNCPT method register. */
static inline u32 nvhost_opcode_imm_incr_syncpt(unsigned cond, unsigned indx)
{
	return nvhost_opcode_imm(NV_CLASS_HOST_INCR_SYNCPT,
		nvhost_class_host_incr_syncpt(cond, indx));
}
246 | |||
247 | static inline u32 nvhost_opcode_restart(unsigned address) | ||
248 | { | ||
249 | return (5 << 28) | (address >> 4); | ||
250 | } | ||
251 | |||
252 | static inline u32 nvhost_opcode_gather(unsigned count) | ||
253 | { | ||
254 | return (6 << 28) | count; | ||
255 | } | ||
256 | |||
257 | static inline u32 nvhost_opcode_gather_nonincr(unsigned offset, unsigned count) | ||
258 | { | ||
259 | return (6 << 28) | (offset << 16) | BIT(15) | count; | ||
260 | } | ||
261 | |||
262 | static inline u32 nvhost_opcode_gather_incr(unsigned offset, unsigned count) | ||
263 | { | ||
264 | return (6 << 28) | (offset << 16) | BIT(15) | BIT(14) | count; | ||
265 | } | ||
266 | |||
267 | #define NVHOST_OPCODE_NOOP nvhost_opcode_nonincr(0, 0) | ||
268 | |||
269 | static inline u32 nvhost_mask2(unsigned x, unsigned y) | ||
270 | { | ||
271 | return 1 | (1 << (y - x)); | ||
272 | } | ||
273 | |||
274 | #endif | ||
diff --git a/drivers/video/tegra/host/host1x/host1x_hwctx.h b/drivers/video/tegra/host/host1x/host1x_hwctx.h new file mode 100644 index 00000000000..7587642d0e1 --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_hwctx.h | |||
@@ -0,0 +1,65 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_hwctx.h | ||
3 | * | ||
4 | * Tegra Graphics Host HOST1X Hardware Context Interface | ||
5 | * | ||
6 | * Copyright (c) 2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify | ||
9 | * it under the terms of the GNU General Public License as published by | ||
10 | * the Free Software Foundation; either version 2 of the License, or | ||
11 | * (at your option) any later version. | ||
12 | * | ||
13 | * This program is distributed in the hope that it will be useful, but WITHOUT | ||
14 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
15 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
16 | * more details. | ||
17 | * | ||
18 | * You should have received a copy of the GNU General Public License along | ||
19 | * with this program; if not, write to the Free Software Foundation, Inc., | ||
20 | * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. | ||
21 | */ | ||
22 | |||
23 | #ifndef __NVHOST_HOST1X_HWCTX_H | ||
24 | #define __NVHOST_HOST1X_HWCTX_H | ||
25 | |||
26 | #include <linux/kref.h> | ||
27 | |||
28 | struct nvhost_hwctx_handler; | ||
29 | struct nvhost_channel; | ||
30 | |||
31 | #define to_host1x_hwctx_handler(handler) \ | ||
32 | container_of((handler), struct host1x_hwctx_handler, h) | ||
33 | #define to_host1x_hwctx(h) container_of((h), struct host1x_hwctx, hwctx) | ||
34 | #define host1x_hwctx_handler(_hwctx) to_host1x_hwctx_handler((_hwctx)->hwctx.h) | ||
35 | |||
/* Per-context hardware context state for a host1x-class engine. */
struct host1x_hwctx {
	struct nvhost_hwctx hwctx;	/* generic hwctx base (embedded) */

	/* context-save bookkeeping */
	u32 save_incrs;
	u32 save_thresh;
	u32 save_slots;

	/* restore buffer replayed to bring the context back.
	 * NOTE(review): units of restore_size (words vs bytes) are not
	 * visible here - confirm at the users of this field. */
	struct nvmap_handle_ref *restore;
	u32 *restore_virt;		/* kernel mapping of restore buffer */
	phys_addr_t restore_phys;	/* DMA address of restore buffer */
	u32 restore_size;
	u32 restore_incrs;
};
49 | |||
/* Shared (per engine, not per context) context-switch handler state. */
struct host1x_hwctx_handler {
	struct nvhost_hwctx_handler h;	/* generic handler base (embedded) */

	u32 syncpt;			/* syncpt id used for ctx switches */
	u32 waitbase;			/* wait base id paired with syncpt */
	u32 restore_size;
	u32 restore_incrs;
	/* save buffer shared by all contexts of this engine */
	struct nvmap_handle_ref *save_buf;
	u32 save_incrs;
	u32 save_thresh;
	u32 save_slots;
	phys_addr_t save_phys;		/* DMA address of save buffer */
	u32 save_size;
};
64 | |||
65 | #endif | ||
diff --git a/drivers/video/tegra/host/host1x/host1x_intr.c b/drivers/video/tegra/host/host1x/host1x_intr.c new file mode 100644 index 00000000000..47e984e2943 --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_intr.c | |||
@@ -0,0 +1,218 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_intr.c | ||
3 | * | ||
4 | * Tegra Graphics Host Interrupt Management | ||
5 | * | ||
6 | * Copyright (c) 2010-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
21 | #include <linux/interrupt.h> | ||
22 | #include <linux/irq.h> | ||
23 | |||
24 | #include "nvhost_intr.h" | ||
25 | #include "dev.h" | ||
26 | #include "host1x_hardware.h" | ||
27 | |||
28 | |||
29 | /*** HW host sync management ***/ | ||
30 | |||
/* One-time host sync setup: disable the IP busy timeout and max out the
 * context-switch auto-ack timeout. */
static void t20_intr_init_host_sync(struct nvhost_intr *intr)
{
	struct nvhost_master *dev = intr_to_dev(intr);
	void __iomem *sync_regs = dev->sync_aperture;
	/* disable the ip_busy_timeout. this prevents write drops, etc.
	 * there's no real way to recover from a hung client anyway.
	 */
	writel(0, sync_regs + HOST1X_SYNC_IP_BUSY_TIMEOUT);

	/* increase the auto-ack timeout to the maximum value. 2d will hang
	 * otherwise on ap20.
	 */
	writel(0xff, sync_regs + HOST1X_SYNC_CTXSW_TIMEOUT_CFG);
}
45 | |||
46 | static void t20_intr_set_host_clocks_per_usec(struct nvhost_intr *intr, u32 cpm) | ||
47 | { | ||
48 | struct nvhost_master *dev = intr_to_dev(intr); | ||
49 | void __iomem *sync_regs = dev->sync_aperture; | ||
50 | /* write microsecond clock register */ | ||
51 | writel(cpm, sync_regs + HOST1X_SYNC_USEC_CLK); | ||
52 | } | ||
53 | |||
54 | static void t20_intr_set_syncpt_threshold(struct nvhost_intr *intr, | ||
55 | u32 id, u32 thresh) | ||
56 | { | ||
57 | struct nvhost_master *dev = intr_to_dev(intr); | ||
58 | void __iomem *sync_regs = dev->sync_aperture; | ||
59 | thresh &= 0xffff; | ||
60 | writel(thresh, sync_regs + (HOST1X_SYNC_SYNCPT_INT_THRESH_0 + id * 4)); | ||
61 | } | ||
62 | |||
63 | static void t20_intr_enable_syncpt_intr(struct nvhost_intr *intr, u32 id) | ||
64 | { | ||
65 | struct nvhost_master *dev = intr_to_dev(intr); | ||
66 | void __iomem *sync_regs = dev->sync_aperture; | ||
67 | writel(BIT(id), sync_regs + HOST1X_SYNC_SYNCPT_THRESH_INT_ENABLE_CPU0); | ||
68 | } | ||
69 | |||
/* Mask all syncpt threshold interrupts and clear any pending status,
 * for both CPU interrupt lines. */
static void t20_intr_disable_all_syncpt_intrs(struct nvhost_intr *intr)
{
	struct nvhost_master *dev = intr_to_dev(intr);
	void __iomem *sync_regs = dev->sync_aperture;
	/* disable interrupts for both cpu's */
	writel(0, sync_regs + HOST1X_SYNC_SYNCPT_THRESH_INT_DISABLE);

	/* clear status for both cpu's */
	writel(0xffffffffu, sync_regs +
		HOST1X_SYNC_SYNCPT_THRESH_CPU0_INT_STATUS);
	writel(0xffffffffu, sync_regs +
		HOST1X_SYNC_SYNCPT_THRESH_CPU1_INT_STATUS);
}
83 | |||
/**
 * Sync point threshold interrupt service function
 * Handles sync point threshold triggers, in interrupt context.
 * Masks and acks the triggering syncpt, then defers the rest of the
 * work to the threaded handler (IRQ_WAKE_THREAD) registered in
 * t20_request_syncpt_irq().
 */
irqreturn_t t20_intr_syncpt_thresh_isr(int irq, void *dev_id)
{
	struct nvhost_intr_syncpt *syncpt = dev_id;
	unsigned int id = syncpt->id;
	struct nvhost_intr *intr = intr_syncpt_to_intr(syncpt);

	void __iomem *sync_regs = intr_to_dev(intr)->sync_aperture;

	/* mask this syncpt's threshold interrupt ... */
	writel(BIT(id),
		sync_regs + HOST1X_SYNC_SYNCPT_THRESH_INT_DISABLE);
	/* ... and ack its pending status on CPU0 */
	writel(BIT(id),
		sync_regs + HOST1X_SYNC_SYNCPT_THRESH_CPU0_INT_STATUS);

	return IRQ_WAKE_THREAD;
}
103 | |||
/**
 * Host general interrupt service function
 * Handles read / write failures: logs the faulting address for IP
 * read/write timeouts, then acks both status registers.
 */
static irqreturn_t t20_intr_host1x_isr(int irq, void *dev_id)
{
	struct nvhost_intr *intr = dev_id;
	void __iomem *sync_regs = intr_to_dev(intr)->sync_aperture;
	u32 stat;
	u32 ext_stat;
	u32 addr;

	stat = readl(sync_regs + HOST1X_SYNC_HINTSTATUS);
	ext_stat = readl(sync_regs + HOST1X_SYNC_HINTSTATUS_EXT);

	if (HOST1X_VAL(SYNC_HINTSTATUS_EXT, IP_READ_INT, ext_stat)) {
		addr = readl(sync_regs + HOST1X_SYNC_IP_READ_TIMEOUT_ADDR);
		pr_err("Host read timeout at address %x\n", addr);
	}

	if (HOST1X_VAL(SYNC_HINTSTATUS_EXT, IP_WRITE_INT, ext_stat)) {
		addr = readl(sync_regs + HOST1X_SYNC_IP_WRITE_TIMEOUT_ADDR);
		pr_err("Host write timeout at address %x\n", addr);
	}

	/* write-back acks exactly the bits we observed */
	writel(ext_stat, sync_regs + HOST1X_SYNC_HINTSTATUS_EXT);
	writel(stat, sync_regs + HOST1X_SYNC_HINTSTATUS);

	return IRQ_HANDLED;
}
/* Request and unmask the general (non-syncpt) host interrupt.
 * Idempotent; returns 0 on success or the request_irq() error. */
static int t20_intr_request_host_general_irq(struct nvhost_intr *intr)
{
	void __iomem *sync_regs = intr_to_dev(intr)->sync_aperture;
	int err;

	if (intr->host_general_irq_requested)
		return 0;

	/* master disable for general (not syncpt) host interrupts */
	writel(0, sync_regs + HOST1X_SYNC_INTMASK);

	/* clear status & extstatus */
	writel(0xfffffffful, sync_regs + HOST1X_SYNC_HINTSTATUS_EXT);
	writel(0xfffffffful, sync_regs + HOST1X_SYNC_HINTSTATUS);

	err = request_irq(intr->host_general_irq, t20_intr_host1x_isr, 0,
			"host_status", intr);
	if (err)
		return err;

	/* enable extra interrupt sources IP_READ_INT and IP_WRITE_INT
	 * (bits 30/31 match the HINTSTATUS_EXT field definitions) */
	writel(BIT(30) | BIT(31), sync_regs + HOST1X_SYNC_HINTMASK_EXT);

	/* enable extra interrupt sources */
	writel(BIT(31), sync_regs + HOST1X_SYNC_HINTMASK);

	/* enable host module interrupt to CPU0 */
	writel(BIT(0), sync_regs + HOST1X_SYNC_INTC0MASK);

	/* master enable for general (not syncpt) host interrupts,
	 * done last so nothing fires before the ISR is in place */
	writel(BIT(0), sync_regs + HOST1X_SYNC_INTMASK);

	intr->host_general_irq_requested = true;

	return err;
}
170 | |||
171 | static void t20_intr_free_host_general_irq(struct nvhost_intr *intr) | ||
172 | { | ||
173 | if (intr->host_general_irq_requested) { | ||
174 | void __iomem *sync_regs = intr_to_dev(intr)->sync_aperture; | ||
175 | |||
176 | /* master disable for general (not syncpt) host interrupts */ | ||
177 | writel(0, sync_regs + HOST1X_SYNC_INTMASK); | ||
178 | |||
179 | free_irq(intr->host_general_irq, intr); | ||
180 | intr->host_general_irq_requested = false; | ||
181 | } | ||
182 | } | ||
183 | |||
/* Request the threaded interrupt for one syncpt: the hard ISR masks and
 * acks the trigger, nvhost_syncpt_thresh_fn runs in the IRQ thread.
 * Idempotent; returns 0 on success or the request error. */
static int t20_request_syncpt_irq(struct nvhost_intr_syncpt *syncpt)
{
	int err;
	if (syncpt->irq_requested)
		return 0;

	err = request_threaded_irq(syncpt->irq,
				t20_intr_syncpt_thresh_isr,
				nvhost_syncpt_thresh_fn,
				0, syncpt->thresh_irq_name, syncpt);
	if (err)
		return err;

	syncpt->irq_requested = 1;
	return 0;
}
200 | |||
/* Install the Tegra2-generation interrupt operations. Returns 0. */
int nvhost_init_t20_intr_support(struct nvhost_master *host)
{
	host->op.intr.init_host_sync = t20_intr_init_host_sync;
	host->op.intr.set_host_clocks_per_usec =
		t20_intr_set_host_clocks_per_usec;
	host->op.intr.set_syncpt_threshold = t20_intr_set_syncpt_threshold;
	host->op.intr.enable_syncpt_intr = t20_intr_enable_syncpt_intr;
	host->op.intr.disable_all_syncpt_intrs =
		t20_intr_disable_all_syncpt_intrs;
	host->op.intr.request_host_general_irq =
		t20_intr_request_host_general_irq;
	host->op.intr.free_host_general_irq =
		t20_intr_free_host_general_irq;
	host->op.intr.request_syncpt_irq =
		t20_request_syncpt_irq;

	return 0;
}
diff --git a/drivers/video/tegra/host/host1x/host1x_syncpt.c b/drivers/video/tegra/host/host1x/host1x_syncpt.c new file mode 100644 index 00000000000..b0fd9970aaa --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_syncpt.c | |||
@@ -0,0 +1,248 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_syncpt.c | ||
3 | * | ||
4 | * Tegra Graphics Host Syncpoints for HOST1X | ||
5 | * | ||
6 | * Copyright (c) 2010-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
21 | #include <linux/nvhost_ioctl.h> | ||
22 | #include "nvhost_syncpt.h" | ||
23 | #include "dev.h" | ||
24 | #include "host1x_syncpt.h" | ||
25 | #include "host1x_hardware.h" | ||
26 | |||
27 | /** | ||
28 | * Write the current syncpoint value back to hw. | ||
29 | */ | ||
30 | static void t20_syncpt_reset(struct nvhost_syncpt *sp, u32 id) | ||
31 | { | ||
32 | struct nvhost_master *dev = syncpt_to_dev(sp); | ||
33 | int min = nvhost_syncpt_read_min(sp, id); | ||
34 | writel(min, dev->sync_aperture + (HOST1X_SYNC_SYNCPT_0 + id * 4)); | ||
35 | } | ||
36 | |||
37 | /** | ||
38 | * Write the current waitbase value back to hw. | ||
39 | */ | ||
40 | static void t20_syncpt_reset_wait_base(struct nvhost_syncpt *sp, u32 id) | ||
41 | { | ||
42 | struct nvhost_master *dev = syncpt_to_dev(sp); | ||
43 | writel(sp->base_val[id], | ||
44 | dev->sync_aperture + (HOST1X_SYNC_SYNCPT_BASE_0 + id * 4)); | ||
45 | } | ||
46 | |||
47 | /** | ||
48 | * Read waitbase value from hw. | ||
49 | */ | ||
50 | static void t20_syncpt_read_wait_base(struct nvhost_syncpt *sp, u32 id) | ||
51 | { | ||
52 | struct nvhost_master *dev = syncpt_to_dev(sp); | ||
53 | sp->base_val[id] = readl(dev->sync_aperture + | ||
54 | (HOST1X_SYNC_SYNCPT_BASE_0 + id * 4)); | ||
55 | } | ||
56 | |||
/**
 * Updates the last value read from hardware.
 * (was nvhost_syncpt_update_min)
 *
 * Lock-free: re-reads the live register and retries the cmpxchg until the
 * cached min is replaced without clobbering a concurrent updater's value.
 * Returns the live hardware counter value.
 */
static u32 t20_syncpt_update_min(struct nvhost_syncpt *sp, u32 id)
{
	struct nvhost_master *dev = syncpt_to_dev(sp);
	void __iomem *sync_regs = dev->sync_aperture;
	u32 old, live;

	/* retry until the cached value we snapshot is the one we swap out */
	do {
		old = nvhost_syncpt_read_min(sp, id);
		live = readl(sync_regs + (HOST1X_SYNC_SYNCPT_0 + id * 4));
	} while ((u32)atomic_cmpxchg(&sp->min_val[id], old, live) != old);

	/* min must never pass max; a violation indicates lost bookkeeping */
	if (!nvhost_syncpt_check_max(sp, id, live))
		dev_err(&syncpt_to_dev(sp)->dev->dev,
				"%s failed: id=%u\n",
				__func__,
				id);

	return live;
}
80 | |||
/**
 * Write a cpu syncpoint increment to the hardware, without touching
 * the cache. Caller is responsible for host being powered.
 */
static void t20_syncpt_cpu_incr(struct nvhost_syncpt *sp, u32 id)
{
	struct nvhost_master *dev = syncpt_to_dev(sp);
	BUG_ON(!nvhost_module_powered(dev->dev));
	/* refuse to advance a host-managed syncpt past its cached max:
	 * that would corrupt the wait-expiry bookkeeping */
	if (!client_managed(id) && nvhost_syncpt_min_eq_max(sp, id)) {
		dev_err(&syncpt_to_dev(sp)->dev->dev,
			"Trying to increment syncpoint id %d beyond max\n",
			id);
		nvhost_debug_dump(syncpt_to_dev(sp));
		return;
	}
	/* one bit per syncpt; writing the bit increments that counter */
	writel(BIT(id), dev->sync_aperture + HOST1X_SYNC_SYNCPT_CPU_INCR);
	wmb(); /* make sure the MMIO write is posted before returning */
}
99 | |||
100 | /* check for old WAITs to be removed (avoiding a wrap) */ | ||
101 | static int t20_syncpt_wait_check(struct nvhost_syncpt *sp, | ||
102 | struct nvmap_client *nvmap, | ||
103 | u32 waitchk_mask, | ||
104 | struct nvhost_waitchk *wait, | ||
105 | int num_waitchk) | ||
106 | { | ||
107 | u32 idx; | ||
108 | int err = 0; | ||
109 | |||
110 | /* get current syncpt values */ | ||
111 | for (idx = 0; idx < NV_HOST1X_SYNCPT_NB_PTS; idx++) { | ||
112 | if (BIT(idx) & waitchk_mask) | ||
113 | nvhost_syncpt_update_min(sp, idx); | ||
114 | } | ||
115 | |||
116 | BUG_ON(!wait && !num_waitchk); | ||
117 | |||
118 | /* compare syncpt vs wait threshold */ | ||
119 | while (num_waitchk) { | ||
120 | u32 override; | ||
121 | |||
122 | BUG_ON(wait->syncpt_id >= NV_HOST1X_SYNCPT_NB_PTS); | ||
123 | if (nvhost_syncpt_is_expired(sp, | ||
124 | wait->syncpt_id, wait->thresh)) { | ||
125 | /* | ||
126 | * NULL an already satisfied WAIT_SYNCPT host method, | ||
127 | * by patching its args in the command stream. The | ||
128 | * method data is changed to reference a reserved | ||
129 | * (never given out or incr) NVSYNCPT_GRAPHICS_HOST | ||
130 | * syncpt with a matching threshold value of 0, so | ||
131 | * is guaranteed to be popped by the host HW. | ||
132 | */ | ||
133 | dev_dbg(&syncpt_to_dev(sp)->dev->dev, | ||
134 | "drop WAIT id %d (%s) thresh 0x%x, min 0x%x\n", | ||
135 | wait->syncpt_id, | ||
136 | syncpt_op(sp).name(sp, wait->syncpt_id), | ||
137 | wait->thresh, | ||
138 | nvhost_syncpt_read_min(sp, wait->syncpt_id)); | ||
139 | |||
140 | /* patch the wait */ | ||
141 | override = nvhost_class_host_wait_syncpt( | ||
142 | NVSYNCPT_GRAPHICS_HOST, 0); | ||
143 | err = nvmap_patch_word(nvmap, | ||
144 | (struct nvmap_handle *)wait->mem, | ||
145 | wait->offset, override); | ||
146 | if (err) | ||
147 | break; | ||
148 | } | ||
149 | |||
150 | wait++; | ||
151 | num_waitchk--; | ||
152 | } | ||
153 | return err; | ||
154 | } | ||
155 | |||
156 | |||
/*
 * Human-readable names indexed by hardware syncpt id; returned by
 * t20_syncpt_name(). Empty strings mark unassigned ids (1-7); id 0 is
 * the reserved host syncpt ("gfx_host", aka NVSYNCPT_GRAPHICS_HOST).
 */
static const char *s_syncpt_names[32] = {
	"gfx_host",
	"", "", "", "", "", "", "",
	"disp0_a", "disp1_a", "avp_0",
	"csi_vi_0", "csi_vi_1",
	"vi_isp_0", "vi_isp_1", "vi_isp_2", "vi_isp_3", "vi_isp_4",
	"2d_0", "2d_1",
	"disp0_b", "disp1_b",
	"3d",
	"mpe",
	"disp0_c", "disp1_c",
	"vblank0", "vblank1",
	"mpe_ebm_eof", "mpe_wr_safe",
	"2d_tinyblt",
	"dsi"
};
173 | |||
/* Look up the human-readable name for syncpt @id in s_syncpt_names. */
static const char *t20_syncpt_name(struct nvhost_syncpt *s, u32 id)
{
	BUG_ON(id >= ARRAY_SIZE(s_syncpt_names));
	return s_syncpt_names[id];
}
179 | |||
180 | static void t20_syncpt_debug(struct nvhost_syncpt *sp) | ||
181 | { | ||
182 | u32 i; | ||
183 | for (i = 0; i < NV_HOST1X_SYNCPT_NB_PTS; i++) { | ||
184 | u32 max = nvhost_syncpt_read_max(sp, i); | ||
185 | u32 min = nvhost_syncpt_update_min(sp, i); | ||
186 | if (!max && !min) | ||
187 | continue; | ||
188 | dev_info(&syncpt_to_dev(sp)->dev->dev, | ||
189 | "id %d (%s) min %d max %d\n", | ||
190 | i, syncpt_op(sp).name(sp, i), | ||
191 | min, max); | ||
192 | |||
193 | } | ||
194 | |||
195 | for (i = 0; i < NV_HOST1X_SYNCPT_NB_BASES; i++) { | ||
196 | u32 base_val; | ||
197 | t20_syncpt_read_wait_base(sp, i); | ||
198 | base_val = sp->base_val[i]; | ||
199 | if (base_val) | ||
200 | dev_info(&syncpt_to_dev(sp)->dev->dev, | ||
201 | "waitbase id %d val %d\n", | ||
202 | i, base_val); | ||
203 | |||
204 | } | ||
205 | } | ||
206 | |||
207 | static int syncpt_mutex_try_lock(struct nvhost_syncpt *sp, | ||
208 | unsigned int idx) | ||
209 | { | ||
210 | void __iomem *sync_regs = syncpt_to_dev(sp)->sync_aperture; | ||
211 | /* mlock registers returns 0 when the lock is aquired. | ||
212 | * writing 0 clears the lock. */ | ||
213 | return !!readl(sync_regs + (HOST1X_SYNC_MLOCK_0 + idx * 4)); | ||
214 | } | ||
215 | |||
216 | static void syncpt_mutex_unlock(struct nvhost_syncpt *sp, | ||
217 | unsigned int idx) | ||
218 | { | ||
219 | void __iomem *sync_regs = syncpt_to_dev(sp)->sync_aperture; | ||
220 | |||
221 | writel(0, sync_regs + (HOST1X_SYNC_MLOCK_0 + idx * 4)); | ||
222 | } | ||
223 | |||
224 | int host1x_init_syncpt_support(struct nvhost_master *host) | ||
225 | { | ||
226 | |||
227 | host->sync_aperture = host->aperture + | ||
228 | (NV_HOST1X_CHANNEL0_BASE + | ||
229 | HOST1X_CHANNEL_SYNC_REG_BASE); | ||
230 | |||
231 | host->op.syncpt.reset = t20_syncpt_reset; | ||
232 | host->op.syncpt.reset_wait_base = t20_syncpt_reset_wait_base; | ||
233 | host->op.syncpt.read_wait_base = t20_syncpt_read_wait_base; | ||
234 | host->op.syncpt.update_min = t20_syncpt_update_min; | ||
235 | host->op.syncpt.cpu_incr = t20_syncpt_cpu_incr; | ||
236 | host->op.syncpt.wait_check = t20_syncpt_wait_check; | ||
237 | host->op.syncpt.debug = t20_syncpt_debug; | ||
238 | host->op.syncpt.name = t20_syncpt_name; | ||
239 | host->op.syncpt.mutex_try_lock = syncpt_mutex_try_lock; | ||
240 | host->op.syncpt.mutex_unlock = syncpt_mutex_unlock; | ||
241 | |||
242 | host->syncpt.nb_pts = NV_HOST1X_SYNCPT_NB_PTS; | ||
243 | host->syncpt.nb_bases = NV_HOST1X_SYNCPT_NB_BASES; | ||
244 | host->syncpt.client_managed = NVSYNCPTS_CLIENT_MANAGED; | ||
245 | host->syncpt.nb_mlocks = NV_HOST1X_SYNC_MLOCK_NUM; | ||
246 | |||
247 | return 0; | ||
248 | } | ||
diff --git a/drivers/video/tegra/host/host1x/host1x_syncpt.h b/drivers/video/tegra/host/host1x/host1x_syncpt.h new file mode 100644 index 00000000000..0d263dc92ed --- /dev/null +++ b/drivers/video/tegra/host/host1x/host1x_syncpt.h | |||
@@ -0,0 +1,77 @@ | |||
1 | /* | ||
2 | * drivers/video/tegra/host/host1x/host1x_syncpt.h | ||
3 | * | ||
4 | * Tegra Graphics Host Syncpoints for HOST1X | ||
5 | * | ||
6 | * Copyright (c) 2010-2012, NVIDIA Corporation. | ||
7 | * | ||
8 | * This program is free software; you can redistribute it and/or modify it | ||
9 | * under the terms and conditions of the GNU General Public License, | ||
10 | * version 2, as published by the Free Software Foundation. | ||
11 | * | ||
12 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
13 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
14 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
15 | * more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
19 | */ | ||
20 | |||
#ifndef __NVHOST_HOST1X_HOST1X_SYNCPT_H
#define __NVHOST_HOST1X_HOST1X_SYNCPT_H

/* Fixed hardware syncpoint id assignments for host1x. Ids 1-7 have no
 * assigned unit; id 0 is the reserved host syncpt (see s_syncpt_names
 * in host1x_syncpt.c). Id 30 ("2d_tinyblt") has no define here. */
#define NVSYNCPT_DISP0_A (8)
#define NVSYNCPT_DISP1_A (9)
#define NVSYNCPT_AVP_0 (10)
#define NVSYNCPT_CSI_VI_0 (11)
#define NVSYNCPT_CSI_VI_1 (12)
#define NVSYNCPT_VI_ISP_0 (13)
#define NVSYNCPT_VI_ISP_1 (14)
#define NVSYNCPT_VI_ISP_2 (15)
#define NVSYNCPT_VI_ISP_3 (16)
#define NVSYNCPT_VI_ISP_4 (17)
#define NVSYNCPT_2D_0 (18)
#define NVSYNCPT_2D_1 (19)
#define NVSYNCPT_DISP0_B (20)
#define NVSYNCPT_DISP1_B (21)
#define NVSYNCPT_3D (22)
#define NVSYNCPT_MPE (23)
#define NVSYNCPT_DISP0_C (24)
#define NVSYNCPT_DISP1_C (25)
#define NVSYNCPT_VBLANK0 (26)
#define NVSYNCPT_VBLANK1 (27)
#define NVSYNCPT_MPE_EBM_EOF (28)
#define NVSYNCPT_MPE_WR_SAFE (29)
#define NVSYNCPT_DSI (31)


/* historical assignments, kept for reference */
/*#define NVSYNCPT_2D_CHANNEL2_0 (20) */
/*#define NVSYNCPT_2D_CHANNEL2_1 (21) */
/*#define NVSYNCPT_2D_TINYBLT_WAR (30)*/
/*#define NVSYNCPT_2D_TINYBLT_RESTORE_CLASS_ID (30)*/

/* sync points that are wholly managed by the client */
#define NVSYNCPTS_CLIENT_MANAGED ( \
	BIT(NVSYNCPT_DISP0_A) | BIT(NVSYNCPT_DISP1_A) | \
	BIT(NVSYNCPT_DISP0_B) | BIT(NVSYNCPT_DISP1_B) | \
	BIT(NVSYNCPT_DISP0_C) | BIT(NVSYNCPT_DISP1_C) | \
	BIT(NVSYNCPT_DSI) | \
	BIT(NVSYNCPT_VBLANK0) | BIT(NVSYNCPT_VBLANK1) | \
	BIT(NVSYNCPT_CSI_VI_0) | BIT(NVSYNCPT_CSI_VI_1) | \
	BIT(NVSYNCPT_VI_ISP_1) | BIT(NVSYNCPT_VI_ISP_2) | \
	BIT(NVSYNCPT_VI_ISP_3) | BIT(NVSYNCPT_VI_ISP_4) | \
	BIT(NVSYNCPT_MPE_EBM_EOF) | BIT(NVSYNCPT_MPE_WR_SAFE) | \
	BIT(NVSYNCPT_2D_1) | BIT(NVSYNCPT_AVP_0))


/* waitbase register indices (HOST1X_SYNC_SYNCPT_BASE_0 + 4 * index) */
#define NVWAITBASE_2D_0 (1)
#define NVWAITBASE_2D_1 (2)
#define NVWAITBASE_3D (3)
#define NVWAITBASE_MPE (4)

struct nvhost_master;
int host1x_init_syncpt(struct nvhost_master *host);
int host1x_init_syncpt_support(struct nvhost_master *host);

#endif